Update app.py
app.py
CHANGED
@@ -1,10 +1,8 @@
 import spaces
-import torch
-
+import torch
 import gradio as gr
 from transformers import pipeline
 from huggingface_hub import InferenceClient
-import tempfile
 import os

 MODEL_NAME = "openai/whisper-large-v3-turbo"
@@ -13,6 +11,7 @@ FILE_LIMIT_MB = 1000

 device = 0 if torch.cuda.is_available() else "cpu"

+# Initialize the Whisper pipeline
 pipe = pipeline(
     task="automatic-speech-recognition",
     model=MODEL_NAME,
@@ -20,64 +19,88 @@ pipe = pipeline(
     device=device,
 )

-# Hugging Face
-hf_client = InferenceClient(
+# Set up the Hugging Face inference client
+hf_client = InferenceClient(
+    "CohereForAI/c4ai-command-r-plus-08-2024",
+    token=os.getenv("HF_TOKEN")
+)

 @spaces.GPU
-def transcribe_summarize(
+def transcribe_summarize(audio_input, task):
+    # Validate the input
+    if audio_input is None:
         raise gr.Error("No audio file was submitted! Please upload or record an audio file before submitting your request.")
+
     # Convert speech to text
+    result = pipe(
+        audio_input,
+        batch_size=BATCH_SIZE,
+        generate_kwargs={"task": task},
+        return_timestamps=True
+    )
+    transcribed_text = result["text"]

+    # Summarize the text
     try:
-        summary = hf_client.summarization(
-        summary_text = summary
+        summary = hf_client.summarization(transcribed_text)
+        summary_text = summary.get("summary_text", "Unable to generate a summary.")
     except Exception as e:
-        summary_text = f"An error occurred during summarization: {e}"
+        summary_text = f"An error occurred during summarization: {str(e)}"

-        "summary": summary_text
-    }
+    # Return the results as a list
+    return [transcribed_text, summary_text]

+# CSS styling
 css = """
-footer {
-    visibility: hidden;
-}
+footer { visibility: hidden; }
 """

+# File upload interface
 file_transcribe = gr.Interface(
     fn=transcribe_summarize,
     inputs=[
         gr.Audio(sources="upload", type="filepath", label="Audio File"),
-        gr.Radio(
+        gr.Radio(
+            choices=["transcribe", "translate"],
+            label="Task",
+            value="transcribe"
+        ),
     ],
-    outputs=[
+    outputs=[
+        gr.Textbox(label="Transcribed Text"),
+        gr.Textbox(label="Summary")
+    ],
+    title="Dictation AI: Convert Speech to Text and Summarize",
+    flagging_mode="never"
 )

-mic_transcribe = gr.Interface(
+# Microphone recording interface
+mic_transcribe = gr.Interface(
     fn=transcribe_summarize,
     inputs=[
         gr.Audio(sources="microphone", type="filepath"),
-        gr.Radio(
+        gr.Radio(
+            choices=["transcribe", "translate"],
+            label="Task",
+            value="transcribe"
+        ),
+    ],
+    outputs=[
+        gr.Textbox(label="Transcribed Text"),
+        gr.Textbox(label="Summary")
     ],
-    title="Dictation AI: Speech-to-Text Conversion with Automatic Summaries",
+    title="Dictation AI: Convert Speech to Text and Summarize",
     flagging_mode="never",
+    css=css
 )

+# Main application
 demo = gr.Blocks(theme="Nymbo/Nymbo_Theme")

-# Put the "Audio File" tab first and the "Microphone" tab second
 with demo:
-    gr.TabbedInterface(
+    gr.TabbedInterface(
+        [file_transcribe, mic_transcribe],
+        ["Audio File", "Microphone"]
+    )

+# Run the application
+demo.queue().launch(ssr_mode=False)
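For quick verification after this change, a minimal client-side sketch using gradio_client can call the deployed Space. The Space id ("your-username/your-space") and the audio file name ("sample.wav") are placeholders, not part of this commit; "/predict" is the usual default endpoint name for the first gr.Interface, and view_api() confirms the actual one.

from gradio_client import Client, handle_file

# Placeholder Space id -- replace with the actual repo id of this Space.
client = Client("your-username/your-space")

# List the exposed endpoints and their parameters; with two gr.Interface apps
# sharing one function, the file-upload endpoint is normally "/predict".
client.view_api()

# Call the transcribe-and-summarize function with a local test recording
# ("sample.wav" is an illustrative file name, not part of the commit).
transcript, summary = client.predict(
    handle_file("sample.wav"),  # audio input
    "transcribe",               # task passed to the Whisper pipeline
    api_name="/predict",
)
print(transcript)
print(summary)

Because the summarization step calls hf_client.summarization(...) with the token read from os.getenv("HF_TOKEN") at startup, the Space needs an HF_TOKEN secret configured; otherwise the except branch returns the error message instead of a summary.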