Live-Podcast

Running on Zero

App Files Files Community

openfree committed on 17 days ago

Commit

db70ad9

verified ·

1 Parent(s): 99fb44e

Update app-backup.py

Browse files

Files changed (1) hide show

app-backup.py +24 -135

app-backup.py CHANGED Viewed

@@ -249,69 +249,6 @@ class UnifiedAudioConverter:
             {"role": "user", "content": self._build_prompt(text, language)}
         ]
-    @spaces.GPU(duration=120)
-    def translate_to_korean(self, conversation_json: Dict) -> Dict:
-        """Translate English conversation to Korean using local LLM"""
-        try:
-            self.initialize_local_mode()
-            chat_template = self._get_messages_formatter_type(self.config.local_model_name)
-            provider = LlamaCppPythonProvider(self.local_llm)
-            system_message = """당신은 전문 번역가입니다. 영어 팟캐스트 대화를 자연스러운 한국어 구어체로 번역해주세요.
-            한국적 표현을 사용하고, 팟캐스트에 적합한 친근하고 자연스러운 말투로 번역하세요.
-            전문 용어는 한국어로 적절히 의역하거나 설명을 추가하세요. JSON 형식을 유지하세요."""
-            agent = LlamaCppAgent(
-                provider,
-                system_prompt=system_message,
-                predefined_messages_formatter_type=chat_template,
-                debug_output=False
-            )
-            settings = provider.get_provider_default_settings()
-            settings.temperature = 0.7
-            settings.top_k = 40
-            settings.top_p = 0.95
-            settings.max_tokens = 2048
-            settings.repeat_penalty = 1.1
-            settings.stream = False
-            messages = BasicChatHistory()
-            # 번역할 대화를 JSON 문자열로 변환
-            conversation_str = json.dumps(conversation_json, ensure_ascii=False, indent=2)
-            prompt = f"""다음 영어 팟캐스트 대화를 자연스러운 한국어 구어체로 번역해주세요.
-            한국적 표현과 친근한 말투를 사용하고, JSON 형식을 그대로 유지하세요:
-            {conversation_str}
-            번역된 결과를 JSON 형식으로만 반환해주세요."""
-            response = agent.get_chat_response(
-                prompt,
-                llm_sampling_settings=settings,
-                chat_history=messages,
-                returns_streaming_generator=False,
-                print_output=False
-            )
-            # JSON 파싱
-            pattern = r"\{(?:[^{}]|(?:\{[^{}]*\}))*\}"
-            json_match = re.search(pattern, response)
-            if json_match:
-                translated_json = json.loads(json_match.group())
-                return translated_json
-            else:
-                print("번역 실패, 원본 반환")
-                return conversation_json
-        except Exception as e:
-            print(f"번역 중 오류 발생: {e}, 원본 반환")
-            return conversation_json
     @spaces.GPU(duration=120)
     def extract_conversation_local(self, text: str, language: str = "English", progress=None) -> Dict:
         """Extract conversation using new local LLM (primary method)"""
@@ -322,8 +259,11 @@ class UnifiedAudioConverter:
             chat_template = self._get_messages_formatter_type(self.config.local_model_name)
             provider = LlamaCppPythonProvider(self.local_llm)
-            # 영어로 대화 생성 (일단 영어로 생성하고 한국어 선택시 번역)
-            system_message = "You are an expert at creating podcast conversations in English. Create natural and informative English conversations. Respond only in JSON format."
             agent = LlamaCppAgent(
                 provider,
@@ -342,8 +282,7 @@ class UnifiedAudioConverter:
             messages = BasicChatHistory()
-            # 영어 프롬프트로 생성
-            prompt = self._build_prompt(text, "English")
             response = agent.get_chat_response(
                 prompt,
                 llm_sampling_settings=settings,
@@ -357,14 +296,7 @@ class UnifiedAudioConverter:
             json_match = re.search(pattern, response)
             if json_match:
-                conversation_json = json.loads(json_match.group())
-                # 한국어가 선택된 경우 번역 수행
-                if language == "Korean":
-                    print("한국어 번역 중...")
-                    conversation_json = self.translate_to_korean(conversation_json)
-                return conversation_json
             else:
                 raise ValueError("No valid JSON found in local LLM response")
@@ -378,12 +310,15 @@ class UnifiedAudioConverter:
         try:
             self.initialize_legacy_local_mode()
-            # 영어로 대화 생성
-            system_message = "You are an expert at creating podcast conversations in English. Create natural and informative English conversations."
             chat = [
                 {"role": "system", "content": system_message},
-                {"role": "user", "content": self._build_prompt(text, "English")}
             ]
             terminators = [
@@ -420,14 +355,7 @@ class UnifiedAudioConverter:
             json_match = re.search(pattern, partial_text)
             if json_match:
-                conversation_json = json.loads(json_match.group())
-                # 한국어가 선택된 경우 번역 수행
-                if language == "Korean":
-                    print("한국어 번역 중...")
-                    conversation_json = self.translate_to_korean(conversation_json)
-                return conversation_json
             else:
                 raise ValueError("No valid JSON found in legacy local response")
@@ -455,13 +383,16 @@ class UnifiedAudioConverter:
             raise RuntimeError("API mode not initialized")
         try:
-            # 영어로 대화 생성
-            system_message = "You are an expert at creating podcast conversations in English. Create natural and informative English conversations."
             chat_completion = self.llm_client.chat.completions.create(
                 messages=[
                     {"role": "system", "content": system_message},
-                    {"role": "user", "content": self._build_prompt(text, "English")}
                 ],
                 model=self.config.api_model_name,
             )
@@ -472,14 +403,7 @@ class UnifiedAudioConverter:
             if not json_match:
                 raise ValueError("No valid JSON found in response")
-            conversation_json = json.loads(json_match.group())
-            # 한국어가 선택된 경우 번역 수행
-            if language == "Korean":
-                print("한국어 번역 중...")
-                conversation_json = self.translate_to_korean(conversation_json)
-            return conversation_json
         except Exception as e:
             raise RuntimeError(f"Failed to extract conversation: {e}")
@@ -865,7 +789,6 @@ with gr.Blocks(theme='soft', title="URL to Podcast Converter") as demo:
         - **Primary**: Local LLM ({converter.config.local_model_name}) - Runs on your device
         - **Fallback**: API LLM ({converter.config.api_model_name}) - Used when local fails
         - **Status**: {"✅ Llama CPP Available" if LLAMA_CPP_AVAILABLE else "❌ Llama CPP Not Available - Install llama-cpp-python"}
-        - **한국어 지원**: 영어 대화 생성 후 자연스러운 한국어 구어체로 자동 번역
         """)
     with gr.Row():
@@ -881,7 +804,7 @@ with gr.Blocks(theme='soft', title="URL to Podcast Converter") as demo:
                 choices=["English", "Korean"],
                 value="English",
                 label="Language / 언어",
-                info="Select output language / 출력 언어를 선택하세요 (한국어 선택 시 자동 번역)"
             )
             mode_selector = gr.Radio(
@@ -911,7 +834,6 @@ with gr.Blocks(theme='soft', title="URL to Podcast Converter") as demo:
                 **한국어 지원:**
                 - 🇰🇷 한국어 선택 시 Edge-TTS만 사용 가능합니다
-                - 📝 영어로 대화 생성 후 자연스러운 한국어 구어체로 자동 번역됩니다
                 """)
     convert_btn = gr.Button("🎯 Generate Conversation / 대화 생성", variant="primary", size="lg")
@@ -946,45 +868,12 @@ with gr.Blocks(theme='soft', title="URL to Podcast Converter") as demo:
                 visible=True
             )
-    # TTS 엔진별 설명 및 설치 안내 추가
-    with gr.Row():
-        gr.Markdown("""
-        ### TTS Engine Details / TTS 엔진 상세정보:
-        - **Edge-TTS**: Microsoft's cloud TTS service with high-quality natural voices. Requires internet connection.
-          - 🇰🇷 **한국어 지원**: 자연스러운 한국어 음성 (여성: SunHi, 남성: Hyunsu)
-        - **Spark-TTS**: SparkAudio's local AI model (0.5B parameters) with zero-shot voice cloning capability.
-          - **Setup required**: Clone [Spark-TTS repository](https://github.com/SparkAudio/Spark-TTS) in current directory
-          - Features: Bilingual support (Chinese/English), controllable speech generation
-          - License: CC BY-NC-SA (Non-commercial use only)
-          - ⚠️ **한국어 미지원**
-        - **MeloTTS**: Local TTS with multiple voice options. GPU recommended for better performance.
-          - ⚠️ **한국어 미지원**
-        ### Local LLM Setup / 로컬 LLM 설정:
-        The system now uses **Private-BitSix-Mistral-Small-3.1-24B-Instruct** as the primary LLM, which runs locally on your device for privacy and independence. API fallback is available when needed.
-        로컬 디바이스에서 개인정보 보호와 독립성을 위해 **Private-BitSix-Mistral-Small-3.1-24B-Instruct**를 기본 LLM으로 사용합니다. 필요시 API 폴백이 제공됩니다.
-        ### 한국어 번역 기능 / Korean Translation Feature:
-        - 한국어를 선택하면 영어로 대화를 생성한 후 자연스러운 한국어 구어체로 자동 번역됩니다
-        - 한국적 표현과 친근한 말투를 사용하여 자연스러운 팟캐스트 대화를 만듭니다
-        - When Korean is selected, conversations are generated in English first, then automatically translated to natural Korean colloquial style
-        ### Spark-TTS Setup Instructions:
-        ```bash
-        git clone https://github.com/SparkAudio/Spark-TTS.git
-        cd Spark-TTS
-        pip install -r requirements.txt
-        ```
-        """)
     gr.Examples(
         examples=[
             ["https://huggingface.co/blog/openfree/cycle-navigator", "Local", "Edge-TTS", "English"],
-            ["https://arxiv.org/html/2505.16938v1", "Local", "Edge-TTS", "English"],
-            ["https://domeggook.com/55204552?from=popular100", "Local", "Edge-TTS", "Korean"],
-            ["https://www.wsj.com/articles/nvidia-pushes-further-into-cloud-with-gpu-marketplace-4fba6bdd","Local", "Edge-TTS", "English"],
         ],
         inputs=[url_input, mode_selector, tts_selector, language_selector],
         outputs=[conversation_output, status_output],

             {"role": "user", "content": self._build_prompt(text, language)}
         ]
     @spaces.GPU(duration=120)
     def extract_conversation_local(self, text: str, language: str = "English", progress=None) -> Dict:
         """Extract conversation using new local LLM (primary method)"""
             chat_template = self._get_messages_formatter_type(self.config.local_model_name)
             provider = LlamaCppPythonProvider(self.local_llm)
+            # 언어별 시스템 메시지
+            if language == "Korean":
+                system_message = "당신은 한국어로 팟캐스트 대화를 생성하는 전문가입니다. 자연스럽고 유익한 한국어 대화를 만들어주세요. JSON 형식으로만 응답하세요."
+            else:
+                system_message = "You are an expert at creating podcast conversations in English. Create natural and informative English conversations. Respond only in JSON format."
             agent = LlamaCppAgent(
                 provider,
             messages = BasicChatHistory()
+            prompt = self._build_prompt(text, language)
             response = agent.get_chat_response(
                 prompt,
                 llm_sampling_settings=settings,
             json_match = re.search(pattern, response)
             if json_match:
+                return json.loads(json_match.group())
             else:
                 raise ValueError("No valid JSON found in local LLM response")
         try:
             self.initialize_legacy_local_mode()
+            # 언어별 시스템 메시지
+            if language == "Korean":
+                system_message = "당신은 한국어로 팟캐스트 대화를 생성하는 전문가입니다. 자연스럽고 유익한 한국어 대화를 만들어주세요."
+            else:
+                system_message = "You are an expert at creating podcast conversations in English. Create natural and informative English conversations."
             chat = [
                 {"role": "system", "content": system_message},
+                {"role": "user", "content": self._build_prompt(text, language)}
             ]
             terminators = [
             json_match = re.search(pattern, partial_text)
             if json_match:
+                return json.loads(json_match.group())
             else:
                 raise ValueError("No valid JSON found in legacy local response")
             raise RuntimeError("API mode not initialized")
         try:
+            # 언어별 프롬프트 구성
+            if language == "Korean":
+                system_message = "당신은 한국어로 팟캐스트 대화를 생성하는 전문가입니다. 자연스럽고 유익한 한국어 대화를 만들어주세요."
+            else:
+                system_message = "You are an expert at creating podcast conversations in English. Create natural and informative English conversations."
             chat_completion = self.llm_client.chat.completions.create(
                 messages=[
                     {"role": "system", "content": system_message},
+                    {"role": "user", "content": self._build_prompt(text, language)}
                 ],
                 model=self.config.api_model_name,
             )
             if not json_match:
                 raise ValueError("No valid JSON found in response")
+            return json.loads(json_match.group())
         except Exception as e:
             raise RuntimeError(f"Failed to extract conversation: {e}")
         - **Primary**: Local LLM ({converter.config.local_model_name}) - Runs on your device
         - **Fallback**: API LLM ({converter.config.api_model_name}) - Used when local fails
         - **Status**: {"✅ Llama CPP Available" if LLAMA_CPP_AVAILABLE else "❌ Llama CPP Not Available - Install llama-cpp-python"}
         """)
     with gr.Row():
                 choices=["English", "Korean"],
                 value="English",
                 label="Language / 언어",
+                info="Select output language / 출력 언어를 선택하세요"
             )
             mode_selector = gr.Radio(
                 **한국어 지원:**
                 - 🇰🇷 한국어 선택 시 Edge-TTS만 사용 가능합니다
                 """)
     convert_btn = gr.Button("🎯 Generate Conversation / 대화 생성", variant="primary", size="lg")
                 visible=True
             )
     gr.Examples(
         examples=[
             ["https://huggingface.co/blog/openfree/cycle-navigator", "Local", "Edge-TTS", "English"],
+            ["https://www.bbc.com/news/technology-67988517", "Local", "Spark-TTS", "English"],
+            ["https://huggingface.co/papers/2505.14810", "Local", "Edge-TTS", "Korean"],
         ],
         inputs=[url_input, mode_selector, tts_selector, language_selector],
         outputs=[conversation_output, status_output],