SOMA-Oriental

Running

App Files Files Community

aiqtech committed on Jun 27

Commit

624bbb3

verified ·

1 Parent(s): 19f25c1

Update app.py

Browse files

Files changed (1) hide show

app.py +226 -113

app.py CHANGED Viewed

@@ -195,24 +195,32 @@ class LLMCollaborativeSystem:
 4. 명확한 결론과 다음 단계를 제시하세요
 5. 전문적이고 완성도 높은 최종 보고서 형식으로 작성하세요"""
-    def create_evaluator_prompt(self, user_query: str, supervisor_responses: List[str], researcher_response: str, executor_responses: List[str]) -> str:
         """평가자 AI 프롬프트 생성"""
         return f"""당신은 전체 협력 과정과 결과를 평가하는 평가자 AI입니다.
 사용자 질문: {user_query}
 감독자 AI의 분석 및 지시:
 - 초기 분석: {supervisor_responses[0]}
-- 실행 지시: {supervisor_responses[1]}
-- 검토 피드백: {supervisor_responses[2]}
 조사자 AI의 조사 결과:
 {researcher_response}
 실행자 AI의 구현:
 - 초기 구현: {executor_responses[0]}
-- 최종 보고서: {executor_responses[1]}
 위 전체 과정을 평가하여:
 1. **품질 평가**: 각 AI의 답변 품질과 역할 수행도를 평가하세요 (10점 만점)
 2. **협력 효과성**: AI 간 협력이 얼마나 효과적이었는지 평가하세요
@@ -485,7 +493,7 @@ class LLMCollaborativeSystem:
             generate_content_config = types.GenerateContentConfig(
                 temperature=0.7,
                 top_p=0.8,
-                max_output_tokens=2048,
                 response_mime_type="text/plain"
             )
@@ -768,7 +776,7 @@ class LLMCollaborativeSystem:
             payload = {
                 "model": self.model_id,
                 "messages": full_messages,
-                "max_tokens": 2048,
                 "temperature": 0.7,
                 "top_p": 0.8,
                 "stream": True,
@@ -825,7 +833,7 @@ def process_query_streaming(user_query: str, llm_mode: str):
     global internal_history
     if not user_query:
-        return "", "", "", "", "❌ 질문을 입력해주세요."
     # LLM 모드 설정
     llm_system.set_llm_mode(llm_mode)
@@ -845,7 +853,7 @@ def process_query_streaming(user_query: str, llm_mode: str):
         ):
             supervisor_initial_response += chunk
             supervisor_text = f"[초기 분석] - {datetime.now().strftime('%H:%M:%S')}\n{supervisor_initial_response}"
-            yield supervisor_text, "", "", "", "🔄 감독자 AI가 분석 중..."
         all_responses["supervisor"].append(supervisor_initial_response)
@@ -855,7 +863,7 @@ def process_query_streaming(user_query: str, llm_mode: str):
         # 2단계: 브레이브 검색 수행
         researcher_text = "[웹 검색] 🔍 검색 중...\n"
-        yield supervisor_text, researcher_text, "", "", "🔍 웹 검색 수행 중..."
         search_results = {}
         total_search_count = 0
@@ -867,7 +875,7 @@ def process_query_streaming(user_query: str, llm_mode: str):
                 search_results[keyword] = results
                 total_search_count += len(results)
                 researcher_text += f"✓ '{keyword}' 검색 완료 ({len(results)}개 결과)\n"
-                yield supervisor_text, researcher_text, "", "", f"🔍 '{keyword}' 검색 중..."
             # 동의어로 추가 검색
             synonyms = llm_system.generate_synonyms(keyword)
@@ -877,13 +885,13 @@ def process_query_streaming(user_query: str, llm_mode: str):
                     search_results[f"{keyword} ({synonym})"] = syn_results
                     total_search_count += len(syn_results)
                     researcher_text += f"✓ 동의어 '{synonym}' 검색 완료 ({len(syn_results)}개 결과)\n"
-                    yield supervisor_text, researcher_text, "", "", f"🔍 동의어 '{synonym}' 검색 중..."
         researcher_text += f"\n📊 총 {total_search_count}개의 검색 결과 수집 완료\n"
         # URL 콘텐츠 가져오기 (상위 3개)
         researcher_text += "\n[콘텐츠 분석] 📖 주요 웹페이지 내용 분석 중...\n"
-        yield supervisor_text, researcher_text, "", "", "📖 웹페이지 내용 분석 중..."
         content_analyzed = 0
         for keyword, results in search_results.items():
@@ -898,7 +906,7 @@ def process_query_streaming(user_query: str, llm_mode: str):
                         result['content_preview'] = content[:500]  # 미리보기 저장
                         content_analyzed += 1
                         researcher_text += f"✓ 콘텐츠 분석 완료: {url[:50]}...\n"
-                        yield supervisor_text, researcher_text, "", "", f"📖 분석 중: {url[:30]}..."
         # 3단계: 조사자 AI가 검색 결과 정리
         researcher_prompt = llm_system.create_researcher_prompt(user_query, supervisor_initial_response, search_results)
@@ -911,12 +919,57 @@ def process_query_streaming(user_query: str, llm_mode: str):
         ):
             researcher_response += chunk
             researcher_text = f"[조사 결과 정리] - {datetime.now().strftime('%H:%M:%S')}\n{researcher_response}"
-            yield supervisor_text, researcher_text, "", "", "📝 조사자 AI가 정리 중..."
         all_responses["researcher"].append(researcher_response)
-        # 4단계: 감독자 AI가 조사 내용 기반으로 실행 지시
-        supervisor_execution_prompt = llm_system.create_supervisor_execution_prompt(user_query, researcher_response)
         supervisor_execution_response = ""
         supervisor_text += "\n\n---\n\n[실행 지시] 🔄 생성 중...\n"
@@ -927,11 +980,11 @@ def process_query_streaming(user_query: str, llm_mode: str):
             supervisor_execution_response += chunk
             temp_text = f"{all_responses['supervisor'][0]}\n\n---\n\n[실행 지시] - {datetime.now().strftime('%H:%M:%S')}\n{supervisor_execution_response}"
             supervisor_text = f"[초기 분석] - {datetime.now().strftime('%H:%M:%S')}\n{temp_text}"
-            yield supervisor_text, researcher_text, "", "", "🎯 감독자 AI가 지시 중..."
         all_responses["supervisor"].append(supervisor_execution_response)
-        # 5단계: 실행자 AI가 조사 내용과 지시를 기반으로 초기 구현
         executor_prompt = llm_system.create_executor_prompt(user_query, supervisor_execution_response, researcher_response)
         executor_response = ""
@@ -942,41 +995,117 @@ def process_query_streaming(user_query: str, llm_mode: str):
         ):
             executor_response += chunk
             executor_text = f"[초기 구현] - {datetime.now().strftime('%H:%M:%S')}\n{executor_response}"
-            yield supervisor_text, researcher_text, executor_text, "", "🔧 실행자 AI가 구현 중..."
         all_responses["executor"].append(executor_response)
-        # 6단계: 감독자 AI 검토 및 피드백
-        review_prompt = f"""당신은 거시적 관점에서 분석하고 지도하는 감독자 AI입니다.
 사용자 질문: {user_query}
-실행자 AI의 답변:
 {executor_response}
-이 답변을 검토하고 개선점과 추가 고려사항을 제시해주세요. 구체적이고 실행 가능한 개선 방안을 제시하세요."""
-        review_response = ""
-        supervisor_text = f"[초기 분석] - {datetime.now().strftime('%H:%M:%S')}\n{all_responses['supervisor'][0]}\n\n---\n\n[실행 지시] - {datetime.now().strftime('%H:%M:%S')}\n{all_responses['supervisor'][1]}\n\n---\n\n[검토 및 피드백] 🔄 생성 중...\n"
         for chunk in llm_system.call_llm_streaming(
-            [{"role": "user", "content": review_prompt}],
             "supervisor"
         ):
-            review_response += chunk
-            temp_text = f"{all_responses['supervisor'][0]}\n\n---\n\n[실행 지시] - {datetime.now().strftime('%H:%M:%S')}\n{all_responses['supervisor'][1]}\n\n---\n\n[검토 및 피드백] - {datetime.now().strftime('%H:%M:%S')}\n{review_response}"
             supervisor_text = f"[초기 분석] - {datetime.now().strftime('%H:%M:%S')}\n{temp_text}"
-            yield supervisor_text, researcher_text, executor_text, "", "🔄 감독자 AI가 검토 중..."
-        all_responses["supervisor"].append(review_response)
-        # 7단계: 실행자 AI 최종 보고서 (피드백 반영)
-        final_executor_prompt = llm_system.create_executor_final_prompt(
-            user_query,
-            executor_response,
-            review_response,
-            researcher_response
         )
         final_executor_response = ""
         executor_text += "\n\n---\n\n[최종 보고서] 🔄 작성 중...\n"
@@ -987,95 +1116,50 @@ def process_query_streaming(user_query: str, llm_mode: str):
             final_executor_response += chunk
             temp_text = f"[초기 구현] - {datetime.now().strftime('%H:%M:%S')}\n{all_responses['executor'][0]}\n\n---\n\n[최종 보고서] - {datetime.now().strftime('%H:%M:%S')}\n{final_executor_response}"
             executor_text = temp_text
-            yield supervisor_text, researcher_text, executor_text, "", "📄 최종 보고서 작성 중..."
         all_responses["executor"].append(final_executor_response)
-        # 8단계: 평가자 AI가 전체 과정 평가
-        evaluator_prompt = llm_system.create_evaluator_prompt(
-            user_query,
-            all_responses["supervisor"],
-            all_responses["researcher"][0],
-            all_responses["executor"]
-        )
-        evaluator_response = ""
-        evaluator_text = "[전체 평가] 🔄 평가 중...\n"
-        for chunk in llm_system.call_llm_streaming(
-            [{"role": "user", "content": evaluator_prompt}],
-            "evaluator"
-        ):
-            evaluator_response += chunk
-            evaluator_text = f"[전체 평가] - {datetime.now().strftime('%H:%M:%S')}\n{evaluator_response}"
-            yield supervisor_text, researcher_text, executor_text, evaluator_text, "📊 평가자 AI가 평가 중..."
-        all_responses["evaluator"].append(evaluator_response)
         # 최종 결과 생성 (최종 보고서를 메인으로)
         final_summary = f"""## 🎯 최종 종합 보고서
 ### 📌 사용자 질문
 {user_query}
-### 📄 최종 보고서 (실행자 AI - 피드백 반영)
 {final_executor_response}
 ---
 ### 📊 전체 프로세스 평가 (평가자 AI)
-{evaluator_response}
 ---
-<details>
-<summary>📋 전체 협력 과정 보기</summary>
-#### 🔍 거시적 분석 (감독자 AI)
-{all_responses['supervisor'][0]}
-#### 📚 조사 결과 (조사자 AI)
-{researcher_response}
-#### 🎯 실행 지시 (감독자 AI)
-{all_responses['supervisor'][1]}
-#### 💡 초기 구현 (실행자 AI)
-{executor_response}
-#### ✨ 검토 및 개선사항 (감독자 AI)
-{review_response}
-</details>
 ---
-*이 보고서는 {'Gemini 2.5 Pro' if llm_system.use_gemini else '기본 LLM'}를 사용하여 웹 검색과 AI 협력을 통해 작성되었습니다.*"""
         # 내부 히스토리 업데이트 (UI에는 표시하지 않음)
         internal_history.append((user_query, final_summary))
-        # 최종 요약만 표시
-        display_summary = f"""## 🎯 최종 결과
-### 📄 실행 보고서
-{final_executor_response}
-### 📊 평가 요약
-{evaluator_response.split('### 5️⃣')[1] if '### 5️⃣' in evaluator_response else evaluator_response[-500:]}
----
-*{'Gemini 2.5 Pro' if llm_system.use_gemini else '기본 LLM'} 사용 | 4개 AI 협력 완료*"""
-        yield supervisor_text, researcher_text, executor_text, evaluator_text, "✅ 최종 보고서 완성!"
     except Exception as e:
         error_msg = f"❌ 처리 중 오류: {str(e)}"
-        yield "", "", "", "", error_msg
 def clear_all():
     """모든 내용 초기화"""
     global internal_history
     internal_history = []
-    return "", "", "", "", "🔄 초기화되었습니다."
 # Gradio 인터페이스
 css = """
@@ -1102,12 +1186,22 @@ css = """
     padding-left: 10px !important;
     background-color: #fffbeb !important;
 }
 """
-with gr.Blocks(title="협력적 LLM 시스템", theme=gr.themes.Soft(), css=css) as app:
     gr.Markdown(
         f"""
-        # 🤝 협력적 LLM 시스템 (4-AI 협업 + 평가자)
         """
     )
@@ -1122,10 +1216,13 @@ with gr.Blocks(title="협력적 LLM 시스템", theme=gr.themes.Soft(), css=css)
             - **평가자 AI**: 전체 과정 평가와 개선점 제시
             ### 🌟 주요 기능
             - 20개 검색 결과와 동의어 검색
             - 신뢰도 기반 정보 평가
-            - 실시간 협업과 피드백 반영
-            - 종합적인 품질 평가
             """)
             # LLM 선택 옵션
@@ -1150,7 +1247,20 @@ with gr.Blocks(title="협력적 LLM 시스템", theme=gr.themes.Soft(), css=css)
                 label="상태",
                 interactive=False,
                 value="대기 중...",
-                max_lines=1
             )
     # AI 출력들 - 2x2 그리드
@@ -1160,8 +1270,8 @@ with gr.Blocks(title="협력적 LLM 시스템", theme=gr.themes.Soft(), css=css)
             gr.Markdown("### 🧠 감독자 AI (거시적 분석)")
             supervisor_output = gr.Textbox(
                 label="",
-                lines=15,
-                max_lines=20,
                 interactive=False,
                 elem_classes=["supervisor-box"]
             )
@@ -1170,8 +1280,8 @@ with gr.Blocks(title="협력적 LLM 시스템", theme=gr.themes.Soft(), css=css)
             gr.Markdown("### 🔍 조사자 AI (웹 검색 & 정리)")
             researcher_output = gr.Textbox(
                 label="",
-                lines=15,
-                max_lines=20,
                 interactive=False,
                 elem_classes=["researcher-box"]
             )
@@ -1182,8 +1292,8 @@ with gr.Blocks(title="협력적 LLM 시스템", theme=gr.themes.Soft(), css=css)
             gr.Markdown("### 👁️ 실행자 AI (미시적 구현)")
             executor_output = gr.Textbox(
                 label="",
-                lines=15,
-                max_lines=20,
                 interactive=False,
                 elem_classes=["executor-box"]
             )
@@ -1192,8 +1302,8 @@ with gr.Blocks(title="협력적 LLM 시스템", theme=gr.themes.Soft(), css=css)
             gr.Markdown("### 📊 평가자 AI (전체 평가)")
             evaluator_output = gr.Textbox(
                 label="",
-                lines=15,
-                max_lines=20,
                 interactive=False,
                 elem_classes=["evaluator-box"]
             )
@@ -1202,10 +1312,13 @@ with gr.Blocks(title="협력적 LLM 시스템", theme=gr.themes.Soft(), css=css)
     gr.Examples(
         examples=[
             "기계학습 모델의 성능을 향상시키는 최신 방법은?",
-            "2024년 효과적인 프로젝트 관리 도구와 전략은?",
             "지속 가능한 비즈니스 모델의 최신 트렌드는?",
             "최신 데이터 시각화 도구와 기법은?",
-            "원격 팀의 생산성을 높이는 검증된 방법은?"
         ],
         inputs=user_input,
         label="💡 예제 질문"
@@ -1215,7 +1328,7 @@ with gr.Blocks(title="협력적 LLM 시스템", theme=gr.themes.Soft(), css=css)
     submit_btn.click(
         fn=process_query_streaming,
         inputs=[user_input, llm_mode],
-        outputs=[supervisor_output, researcher_output, executor_output, evaluator_output, status_text]
     ).then(
         fn=lambda: "",
         outputs=[user_input]
@@ -1224,7 +1337,7 @@ with gr.Blocks(title="협력적 LLM 시스템", theme=gr.themes.Soft(), css=css)
     user_input.submit(
         fn=process_query_streaming,
         inputs=[user_input, llm_mode],
-        outputs=[supervisor_output, researcher_output, executor_output, evaluator_output, status_text]
     ).then(
         fn=lambda: "",
         outputs=[user_input]
@@ -1232,7 +1345,7 @@ with gr.Blocks(title="협력적 LLM 시스템", theme=gr.themes.Soft(), css=css)
     clear_btn.click(
         fn=clear_all,
-        outputs=[supervisor_output, researcher_output, executor_output, evaluator_output, status_text]
     )

 4. 명확한 결론과 다음 단계를 제시하세요
 5. 전문적이고 완성도 높은 최종 보고서 형식으로 작성하세요"""
+    def create_evaluator_prompt(self, user_query: str, supervisor_responses: List[str], researcher_response: str, executor_responses: List[str], evaluator_responses: List[str] = None) -> str:
         """평가자 AI 프롬프트 생성"""
+        evaluator_history = ""
+        if evaluator_responses and len(evaluator_responses) > 0:
+            evaluator_history = f"""
+평가자 AI의 이전 평가들:
+- 조사 결과 평가: {evaluator_responses[0] if len(evaluator_responses) > 0 else 'N/A'}
+- 초기 구현 평가: {evaluator_responses[1] if len(evaluator_responses) > 1 else 'N/A'}
+"""
         return f"""당신은 전체 협력 과정과 결과를 평가하는 평가자 AI입니다.
 사용자 질문: {user_query}
 감독자 AI의 분석 및 지시:
 - 초기 분석: {supervisor_responses[0]}
+- 실행 지시: {supervisor_responses[1] if len(supervisor_responses) > 1 else 'N/A'}
+- 개선 지시: {supervisor_responses[2] if len(supervisor_responses) > 2 else 'N/A'}
 조사자 AI의 조사 결과:
 {researcher_response}
 실행자 AI의 구현:
 - 초기 구현: {executor_responses[0]}
+- 최종 보고서: {executor_responses[1] if len(executor_responses) > 1 else 'N/A'}
+{evaluator_history}
 위 전체 과정을 평가하여:
 1. **품질 평가**: 각 AI의 답변 품질과 역할 수행도를 평가하세요 (10점 만점)
 2. **협력 효과성**: AI 간 협력이 얼마나 효과적이었는지 평가하세요
             generate_content_config = types.GenerateContentConfig(
                 temperature=0.7,
                 top_p=0.8,
+                max_output_tokens=4096,
                 response_mime_type="text/plain"
             )
             payload = {
                 "model": self.model_id,
                 "messages": full_messages,
+                "max_tokens": 4096,
                 "temperature": 0.7,
                 "top_p": 0.8,
                 "stream": True,
     global internal_history
     if not user_query:
+        return "", "", "", "", "", "❌ 질문을 입력해주세요."
     # LLM 모드 설정
     llm_system.set_llm_mode(llm_mode)
         ):
             supervisor_initial_response += chunk
             supervisor_text = f"[초기 분석] - {datetime.now().strftime('%H:%M:%S')}\n{supervisor_initial_response}"
+            yield supervisor_text, "", "", "", "", "🔄 감독자 AI가 분석 중..."
         all_responses["supervisor"].append(supervisor_initial_response)
         # 2단계: 브레이브 검색 수행
         researcher_text = "[웹 검색] 🔍 검색 중...\n"
+        yield supervisor_text, researcher_text, "", "", "", "🔍 웹 검색 수행 중..."
         search_results = {}
         total_search_count = 0
                 search_results[keyword] = results
                 total_search_count += len(results)
                 researcher_text += f"✓ '{keyword}' 검색 완료 ({len(results)}개 결과)\n"
+                yield supervisor_text, researcher_text, "", "", "", f"🔍 '{keyword}' 검색 중..."
             # 동의어로 추가 검색
             synonyms = llm_system.generate_synonyms(keyword)
                     search_results[f"{keyword} ({synonym})"] = syn_results
                     total_search_count += len(syn_results)
                     researcher_text += f"✓ 동의어 '{synonym}' 검색 완료 ({len(syn_results)}개 결과)\n"
+                    yield supervisor_text, researcher_text, "", "", "", f"🔍 동의어 '{synonym}' 검색 중..."
         researcher_text += f"\n📊 총 {total_search_count}개의 검색 결과 수집 완료\n"
         # URL 콘텐츠 가져오기 (상위 3개)
         researcher_text += "\n[콘텐츠 분석] 📖 주요 웹페이지 내용 분석 중...\n"
+        yield supervisor_text, researcher_text, "", "", "", "📖 웹페이지 내용 분석 중..."
         content_analyzed = 0
         for keyword, results in search_results.items():
                         result['content_preview'] = content[:500]  # 미리보기 저장
                         content_analyzed += 1
                         researcher_text += f"✓ 콘텐츠 분석 완료: {url[:50]}...\n"
+                        yield supervisor_text, researcher_text, "", "", "", f"📖 분석 중: {url[:30]}..."
         # 3단계: 조사자 AI가 검색 결과 정리
         researcher_prompt = llm_system.create_researcher_prompt(user_query, supervisor_initial_response, search_results)
         ):
             researcher_response += chunk
             researcher_text = f"[조사 결과 정리] - {datetime.now().strftime('%H:%M:%S')}\n{researcher_response}"
+            yield supervisor_text, researcher_text, "", "", "", "📝 조사자 AI가 정리 중..."
         all_responses["researcher"].append(researcher_response)
+        # 4단계: 평가자 AI가 조사 결과 평가
+        evaluator_research_prompt = f"""당신은 전체 협력 과정과 결과를 평가하는 평가자 AI입니다.
+사용자 질문: {user_query}
+감독자 AI의 초기 분석:
+{supervisor_initial_response}
+조사자 AI의 조사 결과:
+{researcher_response}
+위 조사 결과를 평가하여:
+1. 조사의 충실도와 신뢰성을 평가하세요
+2. 누락된 중요 정보가 있는지 확인하세요
+3. 조사 결과의 활용 가능성을 평가하세요
+4. 개선이 필요한 부분을 구체적으로 제시하세요"""
+        evaluator_research_response = ""
+        evaluator_text = "[조사 결과 평가] 🔄 평가 중...\n"
+        for chunk in llm_system.call_llm_streaming(
+            [{"role": "user", "content": evaluator_research_prompt}],
+            "evaluator"
+        ):
+            evaluator_research_response += chunk
+            evaluator_text = f"[조사 결과 평가] - {datetime.now().strftime('%H:%M:%S')}\n{evaluator_research_response}"
+            yield supervisor_text, researcher_text, "", evaluator_text, "", "📊 평가자 AI가 조사 결과 평가 중..."
+        all_responses["evaluator"].append(evaluator_research_response)
+        # 5단계: 감독자 AI가 평가를 반영한 실행 지시
+        supervisor_execution_prompt = f"""당신은 거시적 관점에서 분석하고 지도하는 감독자 AI입니다.
+사용자 질문: {user_query}
+조사자 AI가 정리한 조사 내용:
+{researcher_response}
+평가자 AI의 조사 결과 평가:
+{evaluator_research_response}
+위 조사 내용과 평가를 기반으로 실행자 AI에게 아주 구체적인 지시를 내려주세요:
+1. 평가자의 피드백을 반영하여 지시를 개선하세요
+2. 조사된 정보를 어떻게 활용할지 명확히 지시하세요
+3. 실행 가능한 단계별 작업을 구체적으로 제시하세요
+4. 예상되는 결과물의 형태를 구체적으로 설명하세요"""
         supervisor_execution_response = ""
         supervisor_text += "\n\n---\n\n[실행 지시] 🔄 생성 중...\n"
             supervisor_execution_response += chunk
             temp_text = f"{all_responses['supervisor'][0]}\n\n---\n\n[실행 지시] - {datetime.now().strftime('%H:%M:%S')}\n{supervisor_execution_response}"
             supervisor_text = f"[초기 분석] - {datetime.now().strftime('%H:%M:%S')}\n{temp_text}"
+            yield supervisor_text, researcher_text, "", evaluator_text, "", "🎯 감독자 AI가 지시 중..."
         all_responses["supervisor"].append(supervisor_execution_response)
+        # 6단계: 실행자 AI가 조사 내용과 지시를 기반으로 초기 구현
         executor_prompt = llm_system.create_executor_prompt(user_query, supervisor_execution_response, researcher_response)
         executor_response = ""
         ):
             executor_response += chunk
             executor_text = f"[초기 구현] - {datetime.now().strftime('%H:%M:%S')}\n{executor_response}"
+            yield supervisor_text, researcher_text, executor_text, evaluator_text, "", "🔧 실행자 AI가 구현 중..."
         all_responses["executor"].append(executor_response)
+        # 7단계: 평가자 AI가 초기 구현 평가
+        evaluator_execution_prompt = f"""당신은 전체 협력 과정과 결과를 평가하는 평가자 AI입니다.
+사용자 질문: {user_query}
+실행자 AI의 초기 구현:
+{executor_response}
+감독자 AI의 지시사항:
+{supervisor_execution_response}
+위 초기 구현을 평가하여:
+1. 지시사항이 얼마나 잘 반영되었는지 평가하세요
+2. 구현의 실행 가능성과 구체성을 평가하세요
+3. 누락된 중요 요소가 있는지 확인하세요
+4. 개선이 필요한 부분을 구체적으로 제시하세요"""
+        evaluator_execution_response = ""
+        evaluator_text += "\n\n---\n\n[초기 구현 평가] 🔄 평가 중...\n"
+        for chunk in llm_system.call_llm_streaming(
+            [{"role": "user", "content": evaluator_execution_prompt}],
+            "evaluator"
+        ):
+            evaluator_execution_response += chunk
+            temp_text = f"{all_responses['evaluator'][0]}\n\n---\n\n[초기 구현 평가] - {datetime.now().strftime('%H:%M:%S')}\n{evaluator_execution_response}"
+            evaluator_text = f"[조사 결과 평가] - {datetime.now().strftime('%H:%M:%S')}\n{temp_text}"
+            yield supervisor_text, researcher_text, executor_text, evaluator_text, "", "📊 평가자 AI가 구현 평가 중..."
+        all_responses["evaluator"].append(evaluator_execution_response)
+        # 8단계: 감독자 AI가 평가를 반영한 개선 지시
+        supervisor_improvement_prompt = f"""당신은 거시적 관점에서 분석하고 지도하는 감독자 AI입니다.
 사용자 질문: {user_query}
+실행자 AI의 초기 구현:
 {executor_response}
+평가자 AI의 구현 평가:
+{evaluator_execution_response}
+위 평가를 반영하여 최종 보고서 작성을 위한 개선 지시를 내려주세요:
+1. 평가자가 지적한 모든 개선사항을 구체적으로 반영하세요
+2. 추가로 필요한 구체적인 내용을 지시하세요
+3. 최종 보고서의 구조와 포함해야 할 요소를 명확히 제시하세요"""
+        supervisor_improvement_response = ""
+        supervisor_text += "\n\n---\n\n[개선 지시] 🔄 생성 중...\n"
         for chunk in llm_system.call_llm_streaming(
+            [{"role": "user", "content": supervisor_improvement_prompt}],
             "supervisor"
         ):
+            supervisor_improvement_response += chunk
+            temp_text = f"{all_responses['supervisor'][0]}\n\n---\n\n[실행 지시] - {datetime.now().strftime('%H:%M:%S')}\n{all_responses['supervisor'][1]}\n\n---\n\n[개선 지시] - {datetime.now().strftime('%H:%M:%S')}\n{supervisor_improvement_response}"
             supervisor_text = f"[초기 분석] - {datetime.now().strftime('%H:%M:%S')}\n{temp_text}"
+            yield supervisor_text, researcher_text, executor_text, evaluator_text, "", "🔄 감독자 AI가 개선 지시 중..."
+        all_responses["supervisor"].append(supervisor_improvement_response)
+        # 9단계: 평가자 AI가 전체 과정 최종 평가
+        evaluator_final_prompt = llm_system.create_evaluator_prompt(
+            user_query,
+            all_responses["supervisor"],
+            all_responses["researcher"][0],
+            all_responses["executor"],
+            all_responses["evaluator"]  # 이전 평가들도 전달
         )
+        evaluator_final_response = ""
+        evaluator_text += "\n\n---\n\n[전체 과정 최종 평가] 🔄 평가 중...\n"
+        for chunk in llm_system.call_llm_streaming(
+            [{"role": "user", "content": evaluator_final_prompt}],
+            "evaluator"
+        ):
+            evaluator_final_response += chunk
+            temp_text = f"{all_responses['evaluator'][0]}\n\n---\n\n[초기 구현 평가] - {datetime.now().strftime('%H:%M:%S')}\n{all_responses['evaluator'][1]}\n\n---\n\n[전체 과정 최종 평가] - {datetime.now().strftime('%H:%M:%S')}\n{evaluator_final_response}"
+            evaluator_text = f"[조사 결과 평가] - {datetime.now().strftime('%H:%M:%S')}\n{temp_text}"
+            yield supervisor_text, researcher_text, executor_text, evaluator_text, "", "📊 평가자 AI가 최종 평가 중..."
+        all_responses["evaluator"].append(evaluator_final_response)
+        # 10단계: 실행자 AI 최종 보고서 (모든 피드백 반영)
+        final_executor_prompt = f"""당신은 세부적인 내용을 구현하는 실행자 AI입니다.
+사용자 질문: {user_query}
+조사자 AI의 조사 내용:
+{researcher_response}
+당신의 초기 구현:
+{executor_response}
+감독자 AI의 개선 지시:
+{supervisor_improvement_response}
+평가자 AI의 전체 평가:
+{evaluator_final_response}
+위 모든 피드백을 완전히 반영하여 최종 보고서를 작성하세요:
+1. 모든 개선사항과 지시사항을 빠짐없이 반영하세요
+2. 조사 내용을 최대한 구체적으로 활용하세요
+3. 실행 가능성을 높이는 세부 계획을 포함하세요
+4. 명확한 결론과 다음 단계를 제시하세요
+5. 전문적이고 완성도 높은 최종 보고서 형식으로 작성하세요"""
         final_executor_response = ""
         executor_text += "\n\n---\n\n[최종 보고서] 🔄 작성 중...\n"
             final_executor_response += chunk
             temp_text = f"[초기 구현] - {datetime.now().strftime('%H:%M:%S')}\n{all_responses['executor'][0]}\n\n---\n\n[최종 보고서] - {datetime.now().strftime('%H:%M:%S')}\n{final_executor_response}"
             executor_text = temp_text
+            yield supervisor_text, researcher_text, executor_text, evaluator_text, "", "📄 최종 보고서 작성 중..."
         all_responses["executor"].append(final_executor_response)
         # 최종 결과 생성 (최종 보고서를 메인으로)
         final_summary = f"""## 🎯 최종 종합 보고서
 ### 📌 사용자 질문
 {user_query}
+### 📄 최종 보고서 (실행자 AI - 모든 피드백 반영)
 {final_executor_response}
 ---
 ### 📊 전체 프로세스 평가 (평가자 AI)
+{evaluator_final_response}
 ---
+### 🔍 핵심 조사 결과 (조사자 AI)
+{researcher_response[:800]}...
 ---
+### 📋 프로세스 완료
+- **사용 모델**: {'Gemini 2.5 Pro' if llm_system.use_gemini else '기본 LLM'}
+- **프로세스**: 감독→조사→평가→감독→실행→평가→감독→평가→실행
+- **총 9단계 협력 완료**
+- **생성 시간**: {datetime.now().strftime('%Y-%m-%d %H:%M:%S')}"""
         # 내부 히스토리 업데이트 (UI에는 표시하지 않음)
         internal_history.append((user_query, final_summary))
+        yield supervisor_text, researcher_text, executor_text, evaluator_text, final_summary, "✅ 최종 보고서 완성!"
     except Exception as e:
         error_msg = f"❌ 처리 중 오류: {str(e)}"
+        yield "", "", "", "", error_msg, error_msg
 def clear_all():
     """모든 내용 초기화"""
     global internal_history
     internal_history = []
+    return "", "", "", "", "", "🔄 초기화되었습니다."
 # Gradio 인터페이스
 css = """
     padding-left: 10px !important;
     background-color: #fffbeb !important;
 }
+.final-report-box textarea {
+    border: 2px solid #3b82f6 !important;
+    border-radius: 8px !important;
+    padding: 20px !important;
+    background-color: #eff6ff !important;
+    margin-top: 10px !important;
+    font-size: 16px !important;
+}
 """
+with gr.Blocks(title="협력적 LLM 시스템 - 다단계 평가", theme=gr.themes.Soft(), css=css) as app:
     gr.Markdown(
         f"""
+        # 🤝 협력적 LLM 시스템 (다단계 평가 프로세스)
+        ### 📋 프로세스: 감독(분석) → 조사(검색) → 평가(조사) → 감독(지시) → 실행(초안) → 평가(초안) → 감독(개선) → 평가(최종) → 실행(완성)
         """
     )
             - **평가자 AI**: 전체 과정 평가와 개선점 제시
             ### 🌟 주요 기능
+            - 최대 4096 토큰 지원 (긴 응답 가능)
             - 20개 검색 결과와 동의어 검색
             - 신뢰도 기반 정보 평가
+            - 다단계 평가와 피드백 반영
+            ### 📋 프로세스
+            감독 → 조사 → 평가 → 감독 → 실행 → 평가 → 감독 → 평가 → 실행
             """)
             # LLM 선택 옵션
                 label="상태",
                 interactive=False,
                 value="대기 중...",
+                max_lines=2
+            )
+    # 최종 결과 섹션 추가
+    with gr.Row():
+        with gr.Column():
+            gr.Markdown("### 📊 최종 종합 보고서")
+            final_report = gr.Textbox(
+                label="",
+                lines=25,
+                max_lines=35,
+                interactive=False,
+                value="*최종 보고서가 여기에 표시됩니다.*",
+                elem_classes=["final-report-box"]
             )
     # AI 출력들 - 2x2 그리드
             gr.Markdown("### 🧠 감독자 AI (거시적 분석)")
             supervisor_output = gr.Textbox(
                 label="",
+                lines=12,
+                max_lines=18,
                 interactive=False,
                 elem_classes=["supervisor-box"]
             )
             gr.Markdown("### 🔍 조사자 AI (웹 검색 & 정리)")
             researcher_output = gr.Textbox(
                 label="",
+                lines=12,
+                max_lines=18,
                 interactive=False,
                 elem_classes=["researcher-box"]
             )
             gr.Markdown("### 👁️ 실행자 AI (미시적 구현)")
             executor_output = gr.Textbox(
                 label="",
+                lines=12,
+                max_lines=18,
                 interactive=False,
                 elem_classes=["executor-box"]
             )
             gr.Markdown("### 📊 평가자 AI (전체 평가)")
             evaluator_output = gr.Textbox(
                 label="",
+                lines=12,
+                max_lines=18,
                 interactive=False,
                 elem_classes=["evaluator-box"]
             )
     gr.Examples(
         examples=[
             "기계학습 모델의 성능을 향상시키는 최신 방법은?",
+            "2025년 효과적인 프로젝트 관리 도구와 전략은?",
             "지속 가능한 비즈니스 모델의 최신 트렌드는?",
             "최신 데이터 시각화 도구와 기법은?",
+            "원격 팀의 생산성을 높이는 검증된 방법은?",
+            "스타트업을 위한 효과적인 마케팅 전략은?",
+            "AI 윤리와 규제의 최신 동향은?",
+            "클라우드 네이티브 애플리케이션 개발 모범 사례는?"
         ],
         inputs=user_input,
         label="💡 예제 질문"
     submit_btn.click(
         fn=process_query_streaming,
         inputs=[user_input, llm_mode],
+        outputs=[supervisor_output, researcher_output, executor_output, evaluator_output, final_report, status_text]
     ).then(
         fn=lambda: "",
         outputs=[user_input]
     user_input.submit(
         fn=process_query_streaming,
         inputs=[user_input, llm_mode],
+        outputs=[supervisor_output, researcher_output, executor_output, evaluator_output, final_report, status_text]
     ).then(
         fn=lambda: "",
         outputs=[user_input]
     clear_btn.click(
         fn=clear_all,
+        outputs=[supervisor_output, researcher_output, executor_output, evaluator_output, final_report, status_text]
     )