ANYANTUDRE committed
Commit 5966f2d · 1 Parent(s): f9ec5b7

fixed small bugs

app.py CHANGED
@@ -2,7 +2,7 @@ import gradio as gr
 from huggingface_hub import login
 
 import os
-from languages import get_language_names
+#from languages import get_language_names
 from goai_helpers import goai_traduction, goai_stt, goai_stt2, goai_tts, goai_tts2, goai_ttt_tts_pipeline, goai_stt_ttt_pipeline
 
 auth_token = os.getenv('HF_SPACE_TOKEN')
@@ -12,8 +12,8 @@ login(token=auth_token)
 # list all files in the ./audios directory for the dropdown
 AUDIO_FILES = [f for f in os.listdir('./exples_voix') if os.path.isfile(os.path.join('./exples_voix', f))]
 MODELES_TTS = ["ArissBandoss/coqui-tts-moore-V1", "ArissBandoss/mms-tts-mos-V18"]
-MODELES_ASR = ["ArissBandoss/whisper-small-mos"]
-LANGUAGES = ["Automatic Detection"]
+MODELES_ASR = ["ArissBandoss/whisper-small-mos", "openai/whisper-large-v3-turbo"]
+LANGUAGES = ["Automatic Detection"]
 
 DESCRIPTION = """<div style="display: flex; justify-content: space-between; align-items: center; flex-wrap: wrap;">
 <div style="flex: 1; min-width: 250px;">
@@ -25,7 +25,7 @@ DESCRIPTION = """<div style="display: flex; justify-content: space-between; alig
 <img src="https://github.com/ANYANTUDRE/Stage-IA-Selever-GO-AI-Corp/blob/main/img/goaicorp-logo2.jpg?raw=true" width="300px" style="max-width: 100%; height: auto;">
 </div>
 </div>
-"""
+"""
 
 
 demo = gr.Blocks(theme=gr.themes.Soft())
@@ -53,10 +53,7 @@ goai_stt_if = gr.Interface(
 inputs=[
 gr.Audio(sources=["microphone", "upload"], type="filepath"),
 gr.Dropdown(
-choices=[
-"ArissBandoss/whisper-small-mos",
-"openai/whisper-large-v3-turbo",
-],
+choices=MODELES_ASR,
 value="ArissBandoss/whisper-small-mos",
 label="Model Name"
 ),
@@ -128,7 +125,7 @@ goai_stt_ttt_pipeline_if = gr.Interface(
 gr.Dropdown(
 label="Modèles d'ASR",
 choices=MODELES_ASR,
-value="Automatic Detection"
+value="ArissBandoss/whisper-small-mos",
 ),
 gr.Dropdown(
 choices=LANGUAGES,
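In app.py, the ASR dropdowns now draw their choices from the shared MODELES_ASR constant instead of a hard-coded list, and the default of the « Modèles d'ASR » dropdown is corrected from "Automatic Detection" (which is not a model and not among the choices) to "ArissBandoss/whisper-small-mos". A minimal sketch of the corrected pattern, assuming standard gr.Dropdown behaviour; the component labels below are illustrative, not taken from the diff:

```python
import gradio as gr

# Shared constants, as defined at the top of app.py after this commit.
MODELES_ASR = ["ArissBandoss/whisper-small-mos", "openai/whisper-large-v3-turbo"]
LANGUAGES = ["Automatic Detection"]

# The dropdown default must be one of `choices`; "Automatic Detection" belongs
# to the language dropdown, not the model dropdown.
asr_model_dropdown = gr.Dropdown(
    choices=MODELES_ASR,
    value="ArissBandoss/whisper-small-mos",
    label="Modèles d'ASR",
)

language_dropdown = gr.Dropdown(
    choices=LANGUAGES,
    value="Automatic Detection",
    label="Langue",  # illustrative label, not shown in the diff
)
```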
goai_helpers/goai_stt_ttt_pipeline.py CHANGED
@@ -9,29 +9,26 @@ from goai_helpers.goai_stt2 import transcribe
 auth_token = os.getenv('HF_SPACE_TOKEN')
 login(token=auth_token)
 
-MODEL_ASR = "ArissBandoss/whisper-small-mos"
-LANGUAGE = "Automatic Detection"
-
 
 # gradio interface translation and text to speech function
 @spaces.GPU(duration=120)
 def goai_stt_ttt(
-inputs,
+inputs,
+model,
+language,
 batch_size,
 chunk_length_s,
-stride_length_s,
-model=MODEL_ASR,
-language=LANGUAGE,
+stride_length_s
 ):
 
 # 1. STT: Speech To Text
 mos_text = transcribe(
-inputs,
+inputs,
+model,
+language,
 batch_size,
 chunk_length_s,
-stride_length_s,
-model=model,
-language=language,
+stride_length_s
 )
 yield mos_text, None
 
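In goai_stt_ttt_pipeline.py, the module-level MODEL_ASR and LANGUAGE defaults are removed: goai_stt_ttt now receives inputs, model, and language from the UI and forwards all six arguments positionally to transcribe. A hedged sketch of how the pieces are expected to line up after this commit; the transcribe signature is inferred from the call site, not read from goai_helpers/goai_stt2.py:

```python
# Assumed signature of goai_helpers.goai_stt2.transcribe, inferred from the call below,
# not verified against goai_stt2.py itself.
def transcribe(inputs, model, language, batch_size, chunk_length_s, stride_length_s):
    ...  # placeholder: the real function runs the ASR pipeline and returns text

def goai_stt_ttt(inputs, model, language, batch_size, chunk_length_s, stride_length_s):
    # The parameter order must match the order of the Gradio input components in
    # goai_stt_ttt_pipeline_if, because Gradio passes component values positionally.
    mos_text = transcribe(inputs, model, language, batch_size, chunk_length_s, stride_length_s)
    yield mos_text, None
```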
 
goai_helpers/goai_ttt_tts_pipeline.py CHANGED
@@ -1,5 +1,4 @@
 import os
-import torch
 import spaces
 from huggingface_hub import login
 
@@ -33,11 +32,11 @@ def goai_many_tts(
 else:
 audio_array, sampling_rate = text_to_speech(tts, text, reference_speaker=reference_speaker)
 
-return text, (sampling_rate, audio_array.numpy())
+return sampling_rate, audio_array.numpy()
 
 elif tts_model == "ArissBandoss/mms-tts-mos-V18":
 sample_rate, audio_data = goai_tts(text)
-return text, (sample_rate, audio_data)
+return sample_rate, audio_data
 
 else:
 print("Erreur de modèle!!! Veuillez vérifier le modèle sélectionné.")
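In goai_ttt_tts_pipeline.py, the unused import torch is dropped and goai_many_tts now returns a bare (sampling_rate, audio_array) pair instead of text, (sampling_rate, audio_array), i.e. the tuple format a gr.Audio output component consumes directly. A minimal sketch of that convention, assuming a numpy-typed audio output; the function below is a placeholder, not the real TTS code:

```python
import numpy as np
import gradio as gr

def fake_tts(text: str):
    # Placeholder TTS: returns (sampling_rate, waveform), the same shape of
    # value that goai_many_tts returns after this commit.
    sampling_rate = 16_000
    audio_array = np.zeros(sampling_rate, dtype=np.float32)  # one second of silence
    return sampling_rate, audio_array

# gr.Audio(type="numpy") accepts exactly this (rate, np.ndarray) pair as output.
demo = gr.Interface(fn=fake_tts, inputs=gr.Textbox(), outputs=gr.Audio(type="numpy"))
```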