Spaces:

DeepLearning101
/

ASR-ANNOTATION

Sleeping

App Files Files Community

DeepLearning101 committed on Apr 30, 2024

Commit

7094a64

verified ·

1 Parent(s): b851f75

Update app.py

Browse files

Files changed (1) hide show

app.py +4 -15

app.py CHANGED Viewed

@@ -3,33 +3,23 @@ import gradio as gr
 import whisper
 import os
 # 加載 Whisper 模型
 model = whisper.load_model("large-v2", device="cuda" if torch.cuda.is_available() else "cpu")
 def transcribe(audio_file):
-    # 從 Gradio 文件輸入獲取文件路徑
     audio_path = audio_file
-    # 使用 Whisper 進行語音識別
     result = model.transcribe(audio_path)
     text = result["text"]
-    # 提取上載的音頻文件的基本名字，用作保存轉錄文本的文件名
     base_name = os.path.splitext(os.path.basename(audio_path))[0]
-    # 定義保存轉錄結果的文件路徑
     transcript_file_path = f"txt/{base_name}_transcript.txt"
-    # 確保 txt 目錄存在
     os.makedirs("txt", exist_ok=True)
-    # 將轉錄文本保存到文件
     with open(transcript_file_path, "w") as file:
         file.write(text)
-    # 返回文本和文件路徑，使得文件可以在界麵上下載
     return text, transcript_file_path
-# 創建 Gradio 界麵
 with gr.Blocks(css=".container { max-width: 800px; margin: auto; } .gradio-app { background-color: #f0f0f0; } button { background-color: #4CAF50; color: white; }") as demo:
     gr.Markdown("ASR 語音語料辨識修正工具")
     with gr.Row():
@@ -37,7 +27,6 @@ with gr.Blocks(css=".container { max-width: 800px; margin: auto; } .gradio-app {
         submit_button = gr.Button("語音識別")
     output_text = gr.TextArea(label="識別結果")
     download_link = gr.File(label="下載轉錄文件")
     submit_button.click(fn=transcribe, inputs=audio_input, outputs=[output_text, download_link])
-demo.launch()

 import whisper
 import os
+# 確保 Whisper 模塊被正確加載
+print("Whisper module contents:", dir(whisper))
 # 加載 Whisper 模型
 model = whisper.load_model("large-v2", device="cuda" if torch.cuda.is_available() else "cpu")
 def transcribe(audio_file):
     audio_path = audio_file
     result = model.transcribe(audio_path)
     text = result["text"]
     base_name = os.path.splitext(os.path.basename(audio_path))[0]
     transcript_file_path = f"txt/{base_name}_transcript.txt"
     os.makedirs("txt", exist_ok=True)
     with open(transcript_file_path, "w") as file:
         file.write(text)
     return text, transcript_file_path
 with gr.Blocks(css=".container { max-width: 800px; margin: auto; } .gradio-app { background-color: #f0f0f0; } button { background-color: #4CAF50; color: white; }") as demo:
     gr.Markdown("ASR 語音語料辨識修正工具")
     with gr.Row():
         submit_button = gr.Button("語音識別")
     output_text = gr.TextArea(label="識別結果")
     download_link = gr.File(label="下載轉錄文件")
     submit_button.click(fn=transcribe, inputs=audio_input, outputs=[output_text, download_link])
+demo.launch()