ACE-Singer

Running on Zero

App Files Files Community

ginipick committed 25 days ago

Commit

5f66fab

verified ·

1 Parent(s): 2b8dfa8

Update ui/components-backup2.py

Browse files

Files changed (1) hide show

ui/components-backup2.py +62 -252

ui/components-backup2.py CHANGED Viewed

@@ -15,24 +15,6 @@ import numpy as np
 import json
 from typing import Dict, List, Tuple, Optional
-# [ADDED] OpenAI API 설정
-try:
-    from openai import OpenAI
-    api_key = os.getenv("LLM_API")
-    if api_key:
-        client = OpenAI(api_key=api_key)
-        client_available = True
-        print("✅ OpenAI API client initialized successfully")
-    else:
-        client = None
-        client_available = False
-        print("⚠️ Warning: No OpenAI API key found. AI lyrics generation will be disabled.")
-        print("Set environment variable: export LLM_API='your-openai-api-key'")
-except Exception as e:
-    client = None
-    client_available = False
-    print(f"❌ Warning: Failed to initialize OpenAI client: {e}")
 TAG_DEFAULT = "funk, pop, soul, rock, melodic, guitar, drums, bass, keyboard, percussion, 105 BPM, energetic, upbeat, groovy, vibrant, dynamic"
 LYRIC_DEFAULT = """[verse]
 Neon lights they flicker bright
@@ -71,103 +53,6 @@ Catch the tune and hold it tight
 In this moment we take flight
 """
-# [ADDED] AI 작사 시스템 프롬프트
-LYRIC_SYSTEM_PROMPT = """너는 노래 가사를 작사하는 전문가 역할이다. 이용자가 입력하는 주제에 따라 이에 관련된 노래 가사를 작성하라. 가사의 규칙은 "[  ]"로 구분하여, 다음 예시를 참조하라.
-예시:
-[verse]
-Neon lights they flicker bright
-City hums in dead of night
-Rhythms pulse through concrete veins
-Lost in echoes of refrains
-[verse]
-Bassline groovin' in my chest
-Heartbeats match the city's zest
-Electric whispers fill the air
-Synthesized dreams everywhere
-[chorus]
-Turn it up and let it flow
-Feel the fire let it grow
-In this rhythm we belong
-Hear the night sing out our song
-[verse]
-Guitar strings they start to weep
-Wake the soul from silent sleep
-Every note a story told
-In this night we're bold and gold
-[bridge]
-Voices blend in harmony
-Lost in pure cacophony
-Timeless echoes timeless cries
-Soulful shouts beneath the skies
-[verse]
-Keyboard dances on the keys
-Melodies on evening breeze
-Catch the tune and hold it tight
-In this moment we take flight
-규칙:
-1. 반드시 [verse], [chorus], [bridge] 등의 구조 태그를 사용할 것
-2. 입력 언어와 동일한 언어로 가사를 작성할 것
-3. 각 섹션은 4-8줄 정도로 구성할 것
-4. 주제와 감정에 맞는 운율과 리듬감 있는 가사를 작성할 것"""
-# [ADDED] AI 작사 생성 함수
-def generate_lyrics_with_ai(theme: str, genre: str = None) -> str:
-    """AI를 사용하여 주제 기반 가사 생성"""
-    print(f"🎵 AI 작사 시작: 주제='{theme}', 장르='{genre}'")
-    if not client_available or client is None:
-        print("❌ OpenAI client not available, returning default lyrics")
-        return LYRIC_DEFAULT
-    if not theme or theme.strip() == "":
-        print("⚠️ Empty theme, returning default lyrics")
-        return LYRIC_DEFAULT
-    try:
-        # 장르 정보가 있으면 프롬프트에 추가
-        user_prompt = f"다음 주제로 노래 가사를 작성해주세요: {theme}"
-        if genre and genre != "Custom":
-            user_prompt += f"\n장르: {genre}"
-        print(f"📝 OpenAI API 호출 중...")
-        # [MODIFIED] 사용자가 제시한 API 형식을 표준 형식으로 변환
-        # 실제로는 client.responses.create가 아닌 client.chat.completions.create를 사용
-        response = client.chat.completions.create(
-            model="gpt-4o-mini",  # gpt-4.1-mini는 존재하지 않는 모델명이므로 gpt-4o-mini 사용
-            messages=[
-                {
-                    "role": "system",
-                    "content": LYRIC_SYSTEM_PROMPT
-                },
-                {
-                    "role": "user",
-                    "content": user_prompt
-                }
-            ],
-            temperature=0.8,
-            max_tokens=1500,
-            top_p=1
-        )
-        generated_lyrics = response.choices[0].message.content
-        print(f"✅ AI 작사 완료")
-        print(f"생성된 가사 미리보기: {generated_lyrics[:100]}...")
-        return generated_lyrics
-    except Exception as e:
-        print(f"❌ AI 작사 생성 오류: {e}")
-        import traceback
-        print(f"상세 오류: {traceback.format_exc()}")
-        return LYRIC_DEFAULT
 # 확장된 장르 프리셋 (기존 + 개선된 태그)
 GENRE_PRESETS = {
     "Modern Pop": "pop, synth, drums, guitar, 120 bpm, upbeat, catchy, vibrant, female vocals, polished vocals, radio-ready, commercial, layered vocals",
@@ -335,35 +220,27 @@ def create_enhanced_process_func(original_func):
         lora_name_or_path="none", multi_seed_mode="Single",
         enable_smart_enhancement=True, genre_preset="Custom", **kwargs
     ):
-        print(f"🎵 Enhanced generation started")
-        print(f"Parameters: duration={audio_duration}, prompt='{prompt[:50]}...', multi_seed={multi_seed_mode}")
         # 스마트 프롬프트 확장
         if enable_smart_enhancement and genre_preset != "Custom":
-            enhanced_prompt = enhance_prompt_with_genre(prompt, genre_preset)
-            print(f"Enhanced prompt: {enhanced_prompt[:100]}...")
-        else:
-            enhanced_prompt = prompt
         # 캐시 확인
         cache_params = {
-            'prompt': enhanced_prompt, 'lyrics': lyrics, 'audio_duration': audio_duration,
             'infer_step': infer_step, 'guidance_scale': guidance_scale
         }
         cached_result = generation_cache.get_cached_result(cache_params)
         if cached_result:
-            print("Using cached result")
             return cached_result
         # 다중 시드 생성
         num_candidates = MULTI_SEED_OPTIONS.get(multi_seed_mode, 1)
-        print(f"Generating {num_candidates} candidates")
         if num_candidates == 1:
             # 기존 함수 호출
             result = original_func(
-                audio_duration, enhanced_prompt, lyrics, infer_step, guidance_scale,
                 scheduler_type, cfg_type, omega_scale, manual_seeds,
                 guidance_interval, guidance_interval_decay, min_guidance_scale,
                 use_erg_tag, use_erg_lyric, use_erg_diffusion, oss_steps,
@@ -371,19 +248,58 @@ def create_enhanced_process_func(original_func):
                 ref_audio_strength, ref_audio_input, lora_name_or_path, **kwargs
             )
         else:
-            # 다중 시드 생성을 위한 임시 구현
-            result = original_func(
-                audio_duration, enhanced_prompt, lyrics, infer_step, guidance_scale,
-                scheduler_type, cfg_type, omega_scale, manual_seeds,
-                guidance_interval, guidance_interval_decay, min_guidance_scale,
-                use_erg_tag, use_erg_lyric, use_erg_diffusion, oss_steps,
-                guidance_scale_text, guidance_scale_lyric, audio2audio_enable,
-                ref_audio_strength, ref_audio_input, lora_name_or_path, **kwargs
-            )
         # 결과 캐시
         generation_cache.cache_result(cache_params, result)
-        print(f"Generation completed")
         return result
     return enhanced_func
@@ -409,41 +325,8 @@ def create_output_ui(task_name="Text2Music"):
     return outputs, input_params_json
 def dump_func(*args):
-    """더미 함수 - 실제 음악 생성 대신 로그만 출력"""
-    print(f"🎵 Dummy function called with {len(args)} arguments")
-    if args:
-        print(f"Parameters preview: duration={args[0] if len(args) > 0 else 'N/A'}, prompt='{args[1][:50] if len(args) > 1 else 'N/A'}...'")
-    # 가짜 결과 반환 (실제 구현에서는 진짜 음악 생성 결과)
-    dummy_result = [
-        None,  # 오디오 파일 경로 (None이면 오디오 생성 안됨)
-        {
-            "prompt": args[1] if len(args) > 1 else "test",
-            "lyrics": args[2] if len(args) > 2 else "test lyrics",
-            "audio_duration": args[0] if len(args) > 0 else 30,
-            "status": "완료 (더미 모드 - 실제 음악 생성 안됨)",
-            "infer_step": args[3] if len(args) > 3 else 150,
-            "guidance_scale": args[4] if len(args) > 4 else 15.0,
-            "scheduler_type": args[5] if len(args) > 5 else "euler",
-            "cfg_type": args[6] if len(args) > 6 else "apg",
-            "omega_scale": args[7] if len(args) > 7 else 10.0,
-            "actual_seeds": [1234],
-            "guidance_interval": args[9] if len(args) > 9 else 0.5,
-            "guidance_interval_decay": args[10] if len(args) > 10 else 0.0,
-            "min_guidance_scale": args[11] if len(args) > 11 else 3.0,
-            "use_erg_tag": args[12] if len(args) > 12 else True,
-            "use_erg_lyric": args[13] if len(args) > 13 else False,
-            "use_erg_diffusion": args[14] if len(args) > 14 else True,
-            "oss_steps": [],
-            "guidance_scale_text": args[16] if len(args) > 16 else 0.0,
-            "guidance_scale_lyric": args[17] if len(args) > 17 else 0.0,
-            "audio2audio_enable": args[18] if len(args) > 18 else False,
-            "ref_audio_strength": args[19] if len(args) > 19 else 0.5,
-            "ref_audio_input": args[20] if len(args) > 20 else None,
-            "audio_path": None
-        }
-    ]
-    return dummy_result
 def create_text2music_ui(
     gr,
@@ -568,29 +451,6 @@ def create_text2music_ui(
                         placeholder="콤마로 구분된 태그들...",
                     )
-            # [ADDED] AI 작사 시스템 UI
-            with gr.Group():
-                gr.Markdown("""### 🤖 AI 작사 시스템
-                <center>주제를 입력하고 'AI 작사' 버튼을 클릭하면 자동으로 가사가 생성됩니다.</center>""")
-                with gr.Row():
-                    lyric_theme_input = gr.Textbox(
-                        label="작사 주제",
-                        placeholder="예: 첫사랑의 설렘, 이별의 아픔, 군대가는 남자의 한숨, 희망찬 내일...",
-                        scale=3,
-                        interactive=True
-                    )
-                    generate_lyrics_btn = gr.Button("🤖 AI 작사", variant="secondary", scale=1)
-                # API 상태 표시
-                api_status = gr.Textbox(
-                    value="✅ AI 작사 기능 활성화됨" if client_available else "❌ API 키가 설정되지 않음 (export LLM_API='your-key')",
-                    label="API 상태",
-                    interactive=False,
-                    max_lines=1,
-                    scale=1
-                )
             with gr.Group():
                 gr.Markdown("""### 📝 가사 입력
                 <center>구조 태그 [verse], [chorus], [bridge] 사용을 권장합니다.<br>[instrumental] 또는 [inst]를 사용하면 연주곡을 생성합니다.</center>""")
@@ -722,27 +582,6 @@ def create_text2music_ui(
             text2music_bnt = gr.Button("🎵 Generate Music", variant="primary", size="lg")
-            # [ADDED] AI 작사 이벤트 핸들러
-            def handle_ai_lyrics_generation(theme, genre):
-                """AI 작사 버튼 클릭 처리"""
-                print(f"🤖 AI 작사 버튼 클릭: 주제='{theme}', 장르='{genre}'")
-                if not theme or theme.strip() == "":
-                    return "⚠️ 작사 주제를 입력해주세요!"
-                try:
-                    generated_lyrics = generate_lyrics_with_ai(theme, genre)
-                    return generated_lyrics
-                except Exception as e:
-                    print(f"작사 생성 중 오류: {e}")
-                    return f"❌ 작사 생성 중 오류가 발생했습니다: {str(e)}"
-            generate_lyrics_btn.click(
-                fn=handle_ai_lyrics_generation,
-                inputs=[lyric_theme_input, genre_preset],
-                outputs=[lyrics]
-            )
             # 모든 UI 요소가 정의된 후 이벤트 핸들러 설정
             genre_preset.change(
                 fn=update_tags_from_preset,
@@ -1446,7 +1285,7 @@ def create_main_demo_ui(
     load_data_func=dump_func,
 ):
     with gr.Blocks(
-        title="ACE-Step Model 1.0 DEMO - Enhanced with AI Lyrics",
         theme=gr.themes.Soft(),
         css="""
         .gradio-container {
@@ -1458,20 +1297,13 @@ def create_main_demo_ui(
             border-radius: 8px;
             margin: 5px 0;
         }
-        .ai-lyrics-section {
-            background: linear-gradient(45deg, #f0fff0, #e6ffe6);
-            padding: 15px;
-            border-radius: 10px;
-            margin: 10px 0;
-            border: 2px solid #90EE90;
-        }
         """
     ) as demo:
         gr.Markdown(
             """
-            <h1 style="text-align: center;">🎵 ACE-Step PRO with AI Lyrics</h1>
             <div style="text-align: center; margin: 20px;">
-                <p><strong>🚀 새로운 기능:</strong> 🤖 AI 작사 | 품질 프리셋 | 다중 생성 | 스마트 프롬프트 | 실시간 프리뷰 | 품질 점수</p>
                 <p>
                     <a href="https://ace-step.github.io/" target='_blank'>Project</a> |
                     <a href="https://huggingface.co/ACE-Step/ACE-Step-v1-3.5B">Checkpoints</a> |
@@ -1485,32 +1317,19 @@ def create_main_demo_ui(
         with gr.Accordion("📖 사용법 가이드", open=False):
             gr.Markdown("""
             ### 🎯 빠른 시작
-            1. **🤖 AI 작사**: 주제를 입력하고 'AI 작사' 버튼을 클릭하면 자동으로 가사가 생성됩니다
-            2. **장르 선택**: 원하는 음악 장르를 선택하면 자동으로 최적화된 태그가 적용됩니다
-            3. **품질 설정**: Draft(빠름) → Standard(권장) → High Quality → Ultra 중 선택
-            4. **다중 생성**: "Best of 3/5/10" 선택하면 여러 번 생성하여 최고 품질을 자동 선택합니다
-            5. **프리뷰**: 전체 생성 전 10초 프리뷰로 빠르게 확인할 수 있습니다
-            ### 🤖 AI 작사 기능
-            - **다국어 지원**: 한국어, 영어 등 입력 언어와 동일한 언어로 가사 생성
-            - **주제 예시**: "첫사랑의 설렘", "이별의 아픔", "군대가는 남자의 한숨", "희망찬 내일"
-            - **구조 태그**: [verse], [chorus], [bridge] 태그가 자동으로 포함됩니다
-            - **장르 연동**: 선택한 장르에 맞는 스타일의 가사가 생성됩니다
             ### 💡 품질 향상 팁
             - **고품질 생성**: "High Quality" + "Best of 5" 조합 추천
             - **빠른 테스트**: "Draft" + "프리뷰" 기능 활용
             - **장르 특화**: 장르 프리셋 선택 후 "스마트 향상" 체크
             - **가사 구조**: [verse], [chorus], [bridge] 태그 적극 활용
-            ### ⚙️ API 설정
-            AI 작사 기능을 사용하려면 환경변수에 OpenAI API 키를 설정해야 합니다:
-            ```bash
-            export LLM_API="your-openai-api-key"
-            ```
             """)
-        with gr.Tab("🎵 Enhanced Text2Music with AI Lyrics"):
             create_text2music_ui(
                 gr=gr,
                 text2music_process_func=text2music_process_func,
@@ -1521,15 +1340,6 @@ def create_main_demo_ui(
 if __name__ == "__main__":
-    print("🚀 ACE-Step PRO with AI Lyrics 시작 중...")
-    # API 키 상태 확인
-    if client_available:
-        print("✅ OpenAI API 사용 가능 - AI 작사 기능 활성화됨")
-    else:
-        print("❌ OpenAI API 사용 불가 - 환경변수를 확인하세요")
-        print("설정 방법: export LLM_API='your-openai-api-key'")
     demo = create_main_demo_ui()
     demo.launch(
         server_name="0.0.0.0",

 import json
 from typing import Dict, List, Tuple, Optional
 TAG_DEFAULT = "funk, pop, soul, rock, melodic, guitar, drums, bass, keyboard, percussion, 105 BPM, energetic, upbeat, groovy, vibrant, dynamic"
 LYRIC_DEFAULT = """[verse]
 Neon lights they flicker bright
 In this moment we take flight
 """
 # 확장된 장르 프리셋 (기존 + 개선된 태그)
 GENRE_PRESETS = {
     "Modern Pop": "pop, synth, drums, guitar, 120 bpm, upbeat, catchy, vibrant, female vocals, polished vocals, radio-ready, commercial, layered vocals",
         lora_name_or_path="none", multi_seed_mode="Single",
         enable_smart_enhancement=True, genre_preset="Custom", **kwargs
     ):
         # 스마트 프롬프트 확장
         if enable_smart_enhancement and genre_preset != "Custom":
+            prompt = enhance_prompt_with_genre(prompt, genre_preset)
         # 캐시 확인
         cache_params = {
+            'prompt': prompt, 'lyrics': lyrics, 'audio_duration': audio_duration,
             'infer_step': infer_step, 'guidance_scale': guidance_scale
         }
         cached_result = generation_cache.get_cached_result(cache_params)
         if cached_result:
             return cached_result
         # 다중 시드 생성
         num_candidates = MULTI_SEED_OPTIONS.get(multi_seed_mode, 1)
         if num_candidates == 1:
             # 기존 함수 호출
             result = original_func(
+                audio_duration, prompt, lyrics, infer_step, guidance_scale,
                 scheduler_type, cfg_type, omega_scale, manual_seeds,
                 guidance_interval, guidance_interval_decay, min_guidance_scale,
                 use_erg_tag, use_erg_lyric, use_erg_diffusion, oss_steps,
                 ref_audio_strength, ref_audio_input, lora_name_or_path, **kwargs
             )
         else:
+            # 다중 시드 생성 및 최적 선택
+            candidates = []
+            for i in range(num_candidates):
+                seed = random.randint(1, 10000)
+                try:
+                    result = original_func(
+                        audio_duration, prompt, lyrics, infer_step, guidance_scale,
+                        scheduler_type, cfg_type, omega_scale, str(seed),
+                        guidance_interval, guidance_interval_decay, min_guidance_scale,
+                        use_erg_tag, use_erg_lyric, use_erg_diffusion, oss_steps,
+                        guidance_scale_text, guidance_scale_lyric, audio2audio_enable,
+                        ref_audio_strength, ref_audio_input, lora_name_or_path, **kwargs
+                    )
+                    if result and len(result) > 0:
+                        audio_path = result[0]  # 첫 번째 결과가 오디오 파일 경로
+                        if audio_path and os.path.exists(audio_path):
+                            quality_score = calculate_quality_score(audio_path)
+                            candidates.append({
+                                "result": result,
+                                "quality_score": quality_score,
+                                "seed": seed
+                            })
+                except Exception as e:
+                    print(f"Generation {i+1} failed: {e}")
+                    continue
+            if candidates:
+                # 최고 품질 선택
+                best_candidate = max(candidates, key=lambda x: x["quality_score"])
+                result = best_candidate["result"]
+                # 품질 정보 추가
+                if len(result) > 1 and isinstance(result[1], dict):
+                    result[1]["quality_score"] = best_candidate["quality_score"]
+                    result[1]["selected_seed"] = best_candidate["seed"]
+                    result[1]["candidates_count"] = len(candidates)
+            else:
+                # 모든 생성 실패시 기본 생성
+                result = original_func(
+                    audio_duration, prompt, lyrics, infer_step, guidance_scale,
+                    scheduler_type, cfg_type, omega_scale, manual_seeds,
+                    guidance_interval, guidance_interval_decay, min_guidance_scale,
+                    use_erg_tag, use_erg_lyric, use_erg_diffusion, oss_steps,
+                    guidance_scale_text, guidance_scale_lyric, audio2audio_enable,
+                    ref_audio_strength, ref_audio_input, lora_name_or_path, **kwargs
+                )
         # 결과 캐시
         generation_cache.cache_result(cache_params, result)
         return result
     return enhanced_func
     return outputs, input_params_json
 def dump_func(*args):
+    print(args)
+    return []
 def create_text2music_ui(
     gr,
                         placeholder="콤마로 구분된 태그들...",
                     )
             with gr.Group():
                 gr.Markdown("""### 📝 가사 입력
                 <center>구조 태그 [verse], [chorus], [bridge] 사용을 권장합니다.<br>[instrumental] 또는 [inst]를 사용하면 연주곡을 생성합니다.</center>""")
             text2music_bnt = gr.Button("🎵 Generate Music", variant="primary", size="lg")
             # 모든 UI 요소가 정의된 후 이벤트 핸들러 설정
             genre_preset.change(
                 fn=update_tags_from_preset,
     load_data_func=dump_func,
 ):
     with gr.Blocks(
+        title="ACE-Step Model 1.0 DEMO - Enhanced",
         theme=gr.themes.Soft(),
         css="""
         .gradio-container {
             border-radius: 8px;
             margin: 5px 0;
         }
         """
     ) as demo:
         gr.Markdown(
             """
+            <h1 style="text-align: center;">🎵 ACE-Step PRO</h1>
             <div style="text-align: center; margin: 20px;">
+                <p><strong>🚀 새로운 기능:</strong> 품질 프리셋 | 다중 생성 | 스마트 프롬프트 | 실시간 프리뷰 | 품질 점수</p>
                 <p>
                     <a href="https://ace-step.github.io/" target='_blank'>Project</a> |
                     <a href="https://huggingface.co/ACE-Step/ACE-Step-v1-3.5B">Checkpoints</a> |
         with gr.Accordion("📖 사용법 가이드", open=False):
             gr.Markdown("""
             ### 🎯 빠른 시작
+            1. **장르 선택**: 원하는 음악 장르를 선택하면 자동으로 최적화된 태그가 적용됩니다
+            2. **품질 설정**: Draft(빠름) → Standard(권장) → High Quality → Ultra 중 선택
+            3. **다중 생성**: "Best of 3/5/10" 선택하면 여러 번 생성하여 최고 품질을 자동 선택합니다
+            4. **프리뷰**: 전체 생성 전 10초 프리뷰로 빠르게 확인할 수 있습니다
             ### 💡 품질 향상 팁
             - **고품질 생성**: "High Quality" + "Best of 5" 조합 추천
             - **빠른 테스트**: "Draft" + "프리뷰" 기능 활용
             - **장르 특화**: 장르 프리셋 선택 후 "스마트 향상" 체크
             - **가사 구조**: [verse], [chorus], [bridge] 태그 적극 활용
             """)
+        with gr.Tab("🎵 Enhanced Text2Music"):
             create_text2music_ui(
                 gr=gr,
                 text2music_process_func=text2music_process_func,
 if __name__ == "__main__":
     demo = create_main_demo_ui()
     demo.launch(
         server_name="0.0.0.0",