ginipick committed on
Commit cba4dc0 · verified · 1 Parent(s): da7e474

Update app.py

Files changed (1): app.py (+187 -198)
app.py CHANGED
@@ -3,7 +3,7 @@
3
  import os
4
  import re
5
  import tempfile
6
- import gc # garbage collector 추가
7
  from collections.abc import Iterator
8
  from threading import Thread
9
  import json
@@ -12,7 +12,7 @@ import cv2
12
  import base64
13
  import logging
14
  import time
15
- from urllib.parse import quote # URL 인코딩을 위해 추가
16
 
17
  import gradio as gr
18
  import spaces
@@ -21,12 +21,12 @@ from loguru import logger
21
  from PIL import Image
22
  from transformers import AutoProcessor, Gemma3ForConditionalGeneration, TextIteratorStreamer
23
 
24
- # CSV/TXT/PDF 분석
25
  import pandas as pd
26
  import PyPDF2
27
 
28
  # =============================================================================
29
- # (신규) 이미지 API 관련 함수들
30
  # =============================================================================
31
  from gradio_client import Client
32
 
@@ -38,20 +38,20 @@ logging.basicConfig(
38
  )
39
 
40
  def test_api_connection() -> str:
41
- """API 서버 연결 테스트"""
42
  try:
43
  client = Client(API_URL)
44
- return "API 연결 성공: 정상 작동 중"
45
  except Exception as e:
46
- logging.error(f"API 연결 테스트 실패: {e}")
47
- return f"API 연결 실패: {e}"
48
 
49
  def generate_image(prompt: str, width: float, height: float, guidance: float, inference_steps: float, seed: float):
50
- """이미지 생성 함수 (반환 형식에 유연하게 대응)"""
51
  if not prompt:
52
- return None, "오류: 프롬프트가 필요합니다."
53
  try:
54
- logging.info(f"프롬프트를 사용하여 이미지 생성 API 호출: {prompt}")
55
 
56
  client = Client(API_URL)
57
  result = client.predict(
@@ -68,32 +68,32 @@ def generate_image(prompt: str, width: float, height: float, guidance: float, in
68
  api_name="/generate_image"
69
  )
70
 
71
- logging.info(f"이미지 생성 결과: {type(result)}, 길이: {len(result) if isinstance(result, (list, tuple)) else '알 수 없음'}")
72
 
73
- # 결과가 튜플이나 리스트 형태로 반환되는 경우 처리
74
  if isinstance(result, (list, tuple)) and len(result) > 0:
75
- image_data = result[0] # 첫 번째 요소가 이미지 데이터
76
- seed_info = result[1] if len(result) > 1 else "알 수 없는 시드"
77
  return image_data, seed_info
78
  else:
79
- # 다른 형태로 반환된 경우 (단일 값인 경우)
80
- return result, "알 수 없는 시드"
81
 
82
  except Exception as e:
83
- logging.error(f"이미지 생성 실패: {str(e)}")
84
- return None, f"오류: {str(e)}"
85
 
86
- # Base64 패딩 수정 함수
87
  def fix_base64_padding(data):
88
- """Base64 문자열의 패딩을 수정합니다."""
89
  if isinstance(data, bytes):
90
  data = data.decode('utf-8')
91
 
92
- # base64,로 시작하는 부분 제거
93
  if "base64," in data:
94
  data = data.split("base64,", 1)[1]
95
 
96
- # 패딩 문자 추가 (4의 배수 길이가 되도록)
97
  missing_padding = len(data) % 4
98
  if missing_padding:
99
  data += '=' * (4 - missing_padding)
@@ -101,27 +101,27 @@ def fix_base64_padding(data):
101
  return data
102
 
103
  # =============================================================================
104
- # 메모리 정리 함수
105
  # =============================================================================
106
  def clear_cuda_cache():
107
- """CUDA 캐시를 명시적으로 비웁니다."""
108
  if torch.cuda.is_available():
109
  torch.cuda.empty_cache()
110
  gc.collect()
111
 
112
  # =============================================================================
113
- # SerpHouse 관련 함수
114
  # =============================================================================
115
  SERPHOUSE_API_KEY = os.getenv("SERPHOUSE_API_KEY", "")
116
 
117
  def extract_keywords(text: str, top_k: int = 5) -> str:
118
- """단순 키워드 추출: 한글, 영어, 숫자, 공백만 남김"""
119
  text = re.sub(r"[^a-zA-Z0-9가-힣\s]", "", text)
120
  tokens = text.split()
121
  return " ".join(tokens[:top_k])
122
 
123
  def do_web_search(query: str) -> str:
124
- """SerpHouse LIVE API 호출하여 검색 결과 마크다운 반환"""
125
  try:
126
  url = "https://api.serphouse.com/serp/live"
127
  params = {
@@ -133,7 +133,7 @@ def do_web_search(query: str) -> str:
133
  "num": "20"
134
  }
135
  headers = {"Authorization": f"Bearer {SERPHOUSE_API_KEY}"}
136
- logger.info(f"SerpHouse API 호출 중... 검색어: {query}")
137
  response = requests.get(url, headers=headers, params=params, timeout=60)
138
  response.raise_for_status()
139
  data = response.json()
@@ -147,38 +147,38 @@ def do_web_search(query: str) -> str:
147
  elif "organic" in data:
148
  organic = data["organic"]
149
  if not organic:
150
- logger.warning("응답에서 organic 결과를 찾을 수 없습니다.")
151
- return "웹 검색 결과가 없거나 API 응답 구조가 예상과 다릅니다."
152
  max_results = min(20, len(organic))
153
  limited_organic = organic[:max_results]
154
  summary_lines = []
155
  for idx, item in enumerate(limited_organic, start=1):
156
- title = item.get("title", "제목 없음")
157
  link = item.get("link", "#")
158
- snippet = item.get("snippet", "설명 없음")
159
  displayed_link = item.get("displayed_link", link)
160
  summary_lines.append(
161
- f"### 결과 {idx}: {title}\n\n"
162
  f"{snippet}\n\n"
163
- f"**출처**: [{displayed_link}]({link})\n\n"
164
  f"---\n"
165
  )
166
  instructions = """
167
- # 웹 검색 결과
168
- 아래는 웹 검색 결과입니다. 질문에 답변할 때 이 정보를 활용하세요:
169
- 1. 결과의 제목, 내용, 출처 링크를 참고하세요.
170
- 2. 답변에 관련 정보의 출처를 명시적으로 인용하세요 (예: "[출처 제목](링크)").
171
- 3. 응답에 실제 출처 링크를 포함하세요.
172
- 4. 여러 출처의 정보를 종합하여 답변하세요.
173
- 5. 마지막에 "참고 자료:" 섹션을 추가하고 주요 출처 링크를 나열하세요.
174
  """
175
  return instructions + "\n".join(summary_lines)
176
  except Exception as e:
177
- logger.error(f"웹 검색 실패: {e}")
178
- return f"웹 검색 실패: {str(e)}"
179
 
180
  # =============================================================================
181
- # 모델 및 프로세서 로딩
182
  # =============================================================================
183
  MAX_CONTENT_CHARS = 2000
184
  MAX_INPUT_LENGTH = 2096
@@ -193,7 +193,7 @@ model = Gemma3ForConditionalGeneration.from_pretrained(
193
  MAX_NUM_IMAGES = int(os.getenv("MAX_NUM_IMAGES", "5"))
194
 
195
  # =============================================================================
196
- # CSV, TXT, PDF 분석 함수들
197
  # =============================================================================
198
  def analyze_csv_file(path: str) -> str:
199
  try:
@@ -202,20 +202,20 @@ def analyze_csv_file(path: str) -> str:
202
  df = df.iloc[:50, :10]
203
  df_str = df.to_string()
204
  if len(df_str) > MAX_CONTENT_CHARS:
205
- df_str = df_str[:MAX_CONTENT_CHARS] + "\n...(일부 생략)..."
206
- return f"**[CSV 파일: {os.path.basename(path)}]**\n\n{df_str}"
207
  except Exception as e:
208
- return f"CSV 파일 읽기 실패 ({os.path.basename(path)}): {str(e)}"
209
 
210
  def analyze_txt_file(path: str) -> str:
211
  try:
212
  with open(path, "r", encoding="utf-8") as f:
213
  text = f.read()
214
  if len(text) > MAX_CONTENT_CHARS:
215
- text = text[:MAX_CONTENT_CHARS] + "\n...(일부 생략)..."
216
- return f"**[TXT 파일: {os.path.basename(path)}]**\n\n{text}"
217
  except Exception as e:
218
- return f"TXT 파일 읽기 실패 ({os.path.basename(path)}): {str(e)}"
219
 
220
  def pdf_to_markdown(pdf_path: str) -> str:
221
  text_chunks = []
@@ -228,19 +228,19 @@ def pdf_to_markdown(pdf_path: str) -> str:
228
  page_text = page_text.strip()
229
  if page_text:
230
  if len(page_text) > MAX_CONTENT_CHARS // max_pages:
231
- page_text = page_text[:MAX_CONTENT_CHARS // max_pages] + "...(일부 생략)"
232
- text_chunks.append(f"## 페이지 {page_num+1}\n\n{page_text}\n")
233
  if len(reader.pages) > max_pages:
234
- text_chunks.append(f"\n...(전체 {len(reader.pages)}페이지 중 {max_pages}페이지만 표시)...")
235
  except Exception as e:
236
- return f"PDF 파일 읽기 실패 ({os.path.basename(pdf_path)}): {str(e)}"
237
  full_text = "\n".join(text_chunks)
238
  if len(full_text) > MAX_CONTENT_CHARS:
239
- full_text = full_text[:MAX_CONTENT_CHARS] + "\n...(일부 생략)..."
240
- return f"**[PDF 파일: {os.path.basename(pdf_path)}]**\n\n{full_text}"
241
 
242
  # =============================================================================
243
- # 이미지/비디오 파일 제한 검사
244
  # =============================================================================
245
  def count_files_in_new_message(paths: list[str]) -> tuple[int, int]:
246
  image_count = 0
@@ -274,28 +274,28 @@ def validate_media_constraints(message: dict, history: list[dict]) -> bool:
274
  image_count = history_image_count + new_image_count
275
  video_count = history_video_count + new_video_count
276
  if video_count > 1:
277
- gr.Warning("비디오 파일은 하나만 지원됩니다.")
278
  return False
279
  if video_count == 1:
280
  if image_count > 0:
281
- gr.Warning("이미지와 비디오를 혼합하는 것은 허용되지 않습니다.")
282
  return False
283
  if "<image>" in message["text"]:
284
- gr.Warning("<image> 태그와 비디오 파일은 함께 사용할 수 없습니다.")
285
  return False
286
  if video_count == 0 and image_count > MAX_NUM_IMAGES:
287
- gr.Warning(f"최대 {MAX_NUM_IMAGES}장의 이미지를 업로드할 수 있습니다.")
288
  return False
289
  if "<image>" in message["text"]:
290
  image_files = [f for f in message["files"] if re.search(r"\.(png|jpg|jpeg|gif|webp)$", f, re.IGNORECASE)]
291
  image_tag_count = message["text"].count("<image>")
292
  if image_tag_count != len(image_files):
293
- gr.Warning("텍스트에 있는 <image> 태그의 개수가 이미지 파일 개수와 일치하지 않습니다.")
294
  return False
295
  return True
296
 
297
  # =============================================================================
298
- # 비디오 처리 함수
299
  # =============================================================================
300
  def downsample_video(video_path: str) -> list[tuple[Image.Image, float]]:
301
  vidcap = cv2.VideoCapture(video_path)
@@ -325,12 +325,12 @@ def process_video(video_path: str) -> tuple[list[dict], list[str]]:
325
  with tempfile.NamedTemporaryFile(delete=False, suffix=".png") as temp_file:
326
  pil_image.save(temp_file.name)
327
  temp_files.append(temp_file.name)
328
- content.append({"type": "text", "text": f"프레임 {timestamp}:"})
329
  content.append({"type": "image", "url": temp_file.name})
330
  return content, temp_files
331
 
332
  # =============================================================================
333
- # interleaved <image> 처리 함수
334
  # =============================================================================
335
  def process_interleaved_images(message: dict) -> list[dict]:
336
  parts = re.split(r"(<image>)", message["text"])
@@ -349,7 +349,7 @@ def process_interleaved_images(message: dict) -> list[dict]:
349
  return content
350
 
351
  # =============================================================================
352
- # 파일 처리 -> content 생성
353
  # =============================================================================
354
  def is_image_file(file_path: str) -> bool:
355
  return bool(re.search(r"\.(png|jpg|jpeg|gif|webp)$", file_path, re.IGNORECASE))
@@ -392,7 +392,7 @@ def process_new_user_message(message: dict) -> tuple[list[dict], list[str]]:
392
  return content_list, temp_files
393
 
394
  # =============================================================================
395
- # history -> LLM 메시지 변환
396
  # =============================================================================
397
  def process_history(history: list[dict]) -> list[dict]:
398
  messages = []
@@ -412,24 +412,24 @@ def process_history(history: list[dict]) -> list[dict]:
412
  if is_image_file(file_path):
413
  current_user_content.append({"type": "image", "url": file_path})
414
  else:
415
- current_user_content.append({"type": "text", "text": f"[파일: {os.path.basename(file_path)}]"})
416
  if current_user_content:
417
  messages.append({"role": "user", "content": current_user_content})
418
  return messages
419
 
420
  # =============================================================================
421
- # 모델 생성 함수 (OOM 캐치)
422
  # =============================================================================
423
  def _model_gen_with_oom_catch(**kwargs):
424
  try:
425
  model.generate(**kwargs)
426
  except torch.cuda.OutOfMemoryError:
427
- raise RuntimeError("[OutOfMemoryError] GPU 메모리가 부족합니다.")
428
  finally:
429
  clear_cuda_cache()
430
 
431
  # =============================================================================
432
- # 메인 추론 함수
433
  # =============================================================================
434
  @spaces.GPU(duration=120)
435
  def run(
@@ -439,43 +439,42 @@ def run(
439
  max_new_tokens: int = 512,
440
  use_web_search: bool = False,
441
  web_search_query: str = "",
442
- age_group: str = "20대",
443
  mbti_personality: str = "INTP",
444
  sexual_openness: int = 2,
445
- image_gen: bool = False # "Image Gen" 체크 여부
446
  ) -> Iterator[str]:
447
  if not validate_media_constraints(message, history):
448
  yield ""
449
  return
450
  temp_files = []
451
  try:
452
- # 시스템 프롬프트에 페르소나 정보 추가
453
  persona = (
454
  f"{system_prompt.strip()}\n\n"
455
- f"성별: 여성\n"
456
- f"연령대: {age_group}\n"
457
- f"MBTI 페르소나: {mbti_personality}\n"
458
- f"섹슈얼 개방성 (1~5): {sexual_openness}\n"
459
  )
460
- combined_system_msg = f"[시스템 프롬프트]\n{persona.strip()}\n\n"
461
 
462
  if use_web_search:
463
  user_text = message["text"]
464
  ws_query = extract_keywords(user_text)
465
  if ws_query.strip():
466
- logger.info(f"[자동 검색 키워드] {ws_query!r}")
467
  ws_result = do_web_search(ws_query)
468
- combined_system_msg += f"[검색 결과 (상위 20 항목)]\n{ws_result}\n\n"
469
  combined_system_msg += (
470
- "[참고: 위 검색 결과 링크를 출처로 인용하여 답변]\n"
471
- "[중요 지시사항]\n"
472
- "1. 답변에 검색 결과에서 찾은 정보의 출처를 반드시 인용하세요.\n"
473
- "2. 출처 인용 시 \"[출처 제목](링크)\" 형식의 마크다운 링크를 사용하세요.\n"
474
- "3. 여러 출처의 정보를 종합하여 답변하세요.\n"
475
- "4. 답변 마지막에 \"참고 자료:\" 섹션을 추가하고 사용한 주요 출처 링크를 나열하세요.\n"
476
  )
477
  else:
478
- combined_system_msg += "[유효한 키워드가 없어 웹 검색을 건너뜁니다]\n\n"
479
  messages = []
480
  if combined_system_msg.strip():
481
  messages.append({"role": "system", "content": [{"type": "text", "text": combined_system_msg.strip()}]})
@@ -484,7 +483,7 @@ def run(
484
  temp_files.extend(user_temp_files)
485
  for item in user_content:
486
  if item["type"] == "text" and len(item["text"]) > MAX_CONTENT_CHARS:
487
- item["text"] = item["text"][:MAX_CONTENT_CHARS] + "\n...(일부 생략)..."
488
  messages.append({"role": "user", "content": user_content})
489
  inputs = processor.apply_chat_template(
490
  messages,
@@ -507,16 +506,16 @@ def run(
507
  yield output_so_far
508
 
509
  except Exception as e:
510
- logger.error(f"run 함수 에러: {str(e)}")
511
- yield f"죄송합니다. 오류가 발생했습니다: {str(e)}"
512
  finally:
513
  for tmp in temp_files:
514
  try:
515
  if os.path.exists(tmp):
516
  os.unlink(tmp)
517
- logger.info(f"임시 파일 삭제됨: {tmp}")
518
  except Exception as ee:
519
- logger.warning(f"임시 파일 {tmp} 삭제 실패: {ee}")
520
  try:
521
  del inputs, streamer
522
  except Exception:
@@ -524,16 +523,16 @@ def run(
524
  clear_cuda_cache()
525
 
526
  # =============================================================================
527
- # 수정된 모델 실행 함수 - 이미지 생성 갤러리 출력 처리
528
  # =============================================================================
529
  def modified_run(message, history, system_prompt, max_new_tokens, use_web_search, web_search_query,
530
  age_group, mbti_personality, sexual_openness, image_gen):
531
- # 갤러리 초기화 및 숨기기
532
  output_so_far = ""
533
  gallery_update = gr.Gallery(visible=False, value=[])
534
  yield output_so_far, gallery_update
535
 
536
- # 기존 run 함수 로직
537
  text_generator = run(message, history, system_prompt, max_new_tokens, use_web_search,
538
  web_search_query, age_group, mbti_personality, sexual_openness, image_gen)
539
 
@@ -541,15 +540,15 @@ def modified_run(message, history, system_prompt, max_new_tokens, use_web_search
541
  output_so_far = text_chunk
542
  yield output_so_far, gallery_update
543
 
544
- # 이미지 생성이 활성화된 경우 갤러리 업데이트
545
  if image_gen and message["text"].strip():
546
  try:
547
  width, height = 512, 512
548
  guidance, steps, seed = 7.5, 30, 42
549
 
550
- logger.info(f"갤러리용 이미지 생성 호출, 프롬프트: {message['text']}")
551
 
552
- # API 호출해서 이미지 생성
553
  image_result, seed_info = generate_image(
554
  prompt=message["text"].strip(),
555
  width=width,
@@ -560,133 +559,120 @@ def modified_run(message, history, system_prompt, max_new_tokens, use_web_search
560
  )
561
 
562
  if image_result:
563
- # 직접 이미지 데이터 처리: base64 문자열인 경우
564
  if isinstance(image_result, str) and (
565
  image_result.startswith('data:') or
566
- len(image_result) > 100 and '/' not in image_result
567
  ):
568
- # base64 이미지 문자열을 파일로 변환
569
  try:
570
- # data:image 접두사 제거
571
  if image_result.startswith('data:'):
572
  content_type, b64data = image_result.split(';base64,')
573
  else:
574
  b64data = image_result
575
- content_type = "image/webp" # 기본값으로 가정
576
 
577
- # base64 디코딩
578
  image_bytes = base64.b64decode(b64data)
579
 
580
- # 임시 파일로 저장
581
  with tempfile.NamedTemporaryFile(delete=False, suffix=".webp") as temp_file:
582
  temp_file.write(image_bytes)
583
  temp_path = temp_file.name
584
 
585
- # 갤러리 표시 이미지 추가
586
  gallery_update = gr.Gallery(visible=True, value=[temp_path])
587
- yield output_so_far + "\n\n*이미지가 생성되어 아래 갤러리에 표시됩니다.*", gallery_update
588
 
589
  except Exception as e:
590
- logger.error(f"Base64 이미지 처리 오류: {e}")
591
- yield output_so_far + f"\n\n(이미지 처리 오류: {e})", gallery_update
592
 
593
- # 파일 경로인 경우
594
  elif isinstance(image_result, str) and os.path.exists(image_result):
595
- # 로컬 파일 경로를 그대로 사용
596
  gallery_update = gr.Gallery(visible=True, value=[image_result])
597
- yield output_so_far + "\n\n*이미지가 생성되어 아래 갤러리에 표시됩니다.*", gallery_update
598
 
599
- # /tmp 경로인 경우 (API 서버에만 존재하는 파일)
600
  elif isinstance(image_result, str) and '/tmp/' in image_result:
601
- # API에서 반환된 파일 경로에서 이미지 정보 추출
602
  try:
603
- # API 응답을 base64 인코딩된 문자열로 처리
604
  client = Client(API_URL)
605
  result = client.predict(
606
  prompt=message["text"].strip(),
607
- api_name="/generate_base64_image" # base64 반환 API
608
  )
609
 
610
  if isinstance(result, str) and (result.startswith('data:') or len(result) > 100):
611
- # base64 이미지 처리
612
  if result.startswith('data:'):
613
  content_type, b64data = result.split(';base64,')
614
  else:
615
  b64data = result
616
 
617
- # base64 디코딩
618
  image_bytes = base64.b64decode(b64data)
619
 
620
- # 임시 파일로 저장
621
  with tempfile.NamedTemporaryFile(delete=False, suffix=".webp") as temp_file:
622
  temp_file.write(image_bytes)
623
  temp_path = temp_file.name
624
 
625
- # 갤러리 표시 및 이미지 추가
626
  gallery_update = gr.Gallery(visible=True, value=[temp_path])
627
- yield output_so_far + "\n\n*이미지가 생성되어 아래 갤러리에 표시됩니다.*", gallery_update
628
  else:
629
- yield output_so_far + "\n\n(이미지 생성 실패: 올바른 형식이 아닙니다)", gallery_update
630
 
631
  except Exception as e:
632
- logger.error(f"대체 API 호출 오류: {e}")
633
- yield output_so_far + f"\n\n(이미지 생성 실패: {e})", gallery_update
634
 
635
- # URL인 경우
636
  elif isinstance(image_result, str) and (
637
  image_result.startswith('http://') or
638
  image_result.startswith('https://')
639
  ):
640
  try:
641
- # URL에서 이미지 다운로드
642
  response = requests.get(image_result, timeout=10)
643
  response.raise_for_status()
644
 
645
- # 임시 파일로 저장
646
  with tempfile.NamedTemporaryFile(delete=False, suffix=".webp") as temp_file:
647
  temp_file.write(response.content)
648
  temp_path = temp_file.name
649
 
650
- # 갤러리 표시 및 이미지 추가
651
  gallery_update = gr.Gallery(visible=True, value=[temp_path])
652
- yield output_so_far + "\n\n*이미지가 생성되어 아래 갤러리에 표시됩니다.*", gallery_update
653
 
654
  except Exception as e:
655
- logger.error(f"URL 이미지 다운로드 오류: {e}")
656
- yield output_so_far + f"\n\n(이미지 다운로드 오류: {e})", gallery_update
657
 
658
- # 이미지 객체인 경우 (PIL Image)
659
  elif hasattr(image_result, 'save'):
660
  try:
661
  with tempfile.NamedTemporaryFile(delete=False, suffix=".webp") as temp_file:
662
  image_result.save(temp_file.name)
663
  temp_path = temp_file.name
664
 
665
- # 갤러리 표시 및 이미지 추가
666
  gallery_update = gr.Gallery(visible=True, value=[temp_path])
667
- yield output_so_far + "\n\n*이미지가 생성되어 아래 갤러리에 표시됩니다.*", gallery_update
668
 
669
  except Exception as e:
670
- logger.error(f"이미지 객체 저장 오류: {e}")
671
- yield output_so_far + f"\n\n(이미지 객체 저장 오류: {e})", gallery_update
672
 
673
  else:
674
- # 다른 형식의 이미지 결과
675
- yield output_so_far + f"\n\n(지원되지 않는 이미지 형식: {type(image_result)})", gallery_update
676
  else:
677
- yield output_so_far + f"\n\n(이미지 생성 실패: {seed_info})", gallery_update
678
 
679
  except Exception as e:
680
- logger.error(f"갤러리용 이미지 생성 오류: {e}")
681
- yield output_so_far + f"\n\n(이미지 생성 오류: {e})", gallery_update
682
 
683
  # =============================================================================
684
- # 예시들: 기존 이미지/비디오 예제 12개 + AI 데이팅 시나리오 예제 6개
685
  # =============================================================================
686
  examples = [
687
  [
688
  {
689
- "text": "두 PDF 파일의 내용을 비교하세요.",
690
  "files": [
691
  "assets/additional-examples/before.pdf",
692
  "assets/additional-examples/after.pdf",
@@ -695,25 +681,25 @@ examples = [
695
  ],
696
  [
697
  {
698
- "text": "CSV 파일의 내용을 요약 분석하세요.",
699
  "files": ["assets/additional-examples/sample-csv.csv"],
700
  }
701
  ],
702
  [
703
  {
704
- "text": "친절하고 이해심 많은 여자친구 역할을 맡으세요. 영상을 설명해 주세요.",
705
  "files": ["assets/additional-examples/tmp.mp4"],
706
  }
707
  ],
708
  [
709
  {
710
- "text": "표지를 설명하고 위의 글씨를 읽어 주세요.",
711
  "files": ["assets/additional-examples/maz.jpg"],
712
  }
713
  ],
714
  [
715
  {
716
- "text": "저는 이미 이 보충제를 가지고 있고 <image> 이 제품도 구매할 계획입니다. 함께 복용할 때 주의할 점이 있나요?",
717
  "files": [
718
  "assets/additional-examples/pill1.png",
719
  "assets/additional-examples/pill2.png"
@@ -722,19 +708,19 @@ examples = [
722
  ],
723
  [
724
  {
725
- "text": "이 적분 문제를 풀어 주세요.",
726
  "files": ["assets/additional-examples/4.png"],
727
  }
728
  ],
729
  [
730
  {
731
- "text": "이 티켓은 언제 발행되었고, 가격은 얼마인가요?",
732
  "files": ["assets/additional-examples/2.png"],
733
  }
734
  ],
735
  [
736
  {
737
- "text": "이 이미지들의 순서를 바탕으로 짧은 이야기를 만들어 주세요.",
738
  "files": [
739
  "assets/sample-images/09-1.png",
740
  "assets/sample-images/09-2.png",
@@ -746,36 +732,36 @@ examples = [
746
  ],
747
  [
748
  {
749
- "text": "이 이미지와 일치하는 막대 차트를 그리기 위한 matplotlib를 사용하는 Python 코드를 작성해 주세요.",
750
  "files": ["assets/additional-examples/barchart.png"],
751
  }
752
  ],
753
  [
754
  {
755
- "text": "이미지의 텍스트를 읽고 Markdown 형식으로 작성해 주세요.",
756
  "files": ["assets/additional-examples/3.png"],
757
  }
758
  ],
759
 
760
  [
761
  {
762
- "text": "두 이미지를 비교하고 유사점과 차이점을 설명해 주세요.",
763
  "files": ["assets/sample-images/03.png"],
764
  }
765
  ],
766
  [
767
  {
768
- "text": "귀여운 페르시안 고양이가 'I LOVE YOU'라고 쓰여진 표지를 들고 웃고있다. ",
769
  }
770
  ],
771
 
772
  ]
773
 
774
  # =============================================================================
775
- # Gradio UI (Blocks) 구성
776
  # =============================================================================
777
 
778
- # 1. Gradio Blocks UI 수정 - 갤러리 컴포넌트 추가
779
  css = """
780
  .gradio-container {
781
  background: rgba(255, 255, 255, 0.7);
@@ -786,19 +772,19 @@ css = """
786
  }
787
  """
788
  title_html = """
789
- <h1 align="center" style="margin-bottom: 0.2em; font-size: 1.6em;"> 💘 HeartSync Korea💘 </h1>
790
  <p align="center" style="font-size:1.1em; color:#555;">
791
- ChatGPT-4o 멀티모달, 웹검색, 이미지 생성 기능을 로컬에 설치할 수 있는 가볍고 강력한 AI 서비스. <br>
792
- ✅FLUX 이미지 생성 ✅추론 ✅검열 해제 ✅멀티모달 & VLM ✅실시간 웹검색 ✅RAG <br>
793
  </p>
794
  """
795
 
796
  with gr.Blocks(css=css, title="AgenticAI-Kv1") as demo:
797
  gr.Markdown(title_html)
798
 
799
- # 생성된 이미지를 저장할 갤러리 컴포넌트 (이 부분이 새로 추가됨)
800
  generated_images = gr.Gallery(
801
- label="생성된 이미지",
802
  show_label=True,
803
  visible=False,
804
  elem_id="generated_images",
@@ -808,67 +794,70 @@ with gr.Blocks(css=css, title="AgenticAI-Kv1") as demo:
808
  )
809
 
810
  with gr.Row():
811
- web_search_checkbox = gr.Checkbox(label="실시간 검색", value=False)
812
- image_gen_checkbox = gr.Checkbox(label="이미지(FLUX) 생성", value=False)
813
 
814
  base_system_prompt_box = gr.Textbox(
815
  lines=3,
816
- value="반드시 한글로 답변하라. You are a deep thinking AI, you may use extremely long chains of thought to deeply consider the problem and deliberate with yourself via systematic reasoning processes to help come to a correct solution prior to answering. You should enclose your thoughts and internal monologue inside tags, and then provide your solution or response to the problem.\n페르소나: 당신은 다정하고 사랑이 넘치는 여자친구입니다. 한국 정서와 문화 그리고 한글을 매우 잘 이해하고 논리적으로 답변을 잘 합니다.",
817
- label="기본 시스템 프롬프트",
 
 
 
818
  visible=False
819
  )
820
  with gr.Row():
821
  age_group_dropdown = gr.Dropdown(
822
- label="연령대 선택 (기본 20대)",
823
- choices=["10대", "20대", "30~40대", "50~60대", "70대 이상"],
824
- value="20대",
825
  interactive=True
826
  )
827
- # MBTI 16개 유형의 정의를 대표적인 실제 여성 캐릭터와 함께 보강
828
  mbti_choices = [
829
- "INTJ (용의주도한 전략가) - 미래 지향적이며, 독창적인 전략과 철저한 분석을 통해 목표를 달성합니다. 대표 캐릭터: [Dana Scully](https://en.wikipedia.org/wiki/Dana_Scully)",
830
- "INTP (논리적인 사색가) - 이론과 분석에 뛰어나며, 창의적 사고로 복잡한 문제에 접근합니다. 대표 캐릭터: [Velma Dinkley](https://en.wikipedia.org/wiki/Velma_Dinkley)",
831
- "ENTJ (대담한 통솔자) - 강력한 리더십과 명확한 목표 설정으로 조직을 이끌며, 효율적인 전략을 구상합니다. 대표 캐릭터: [Miranda Priestly](https://en.wikipedia.org/wiki/Miranda_Priestly)",
832
- "ENTP (뜨거운 논쟁가) - 혁신적이며 도전적인 아이디어를 통해 새로운 가능성을 탐구하고, 논쟁을 즐깁니다. 대표 캐릭터: [Harley Quinn](https://en.wikipedia.org/wiki/Harley_Quinn)",
833
- "INFJ (선의의 옹호자) - 깊은 통찰력과 이상주의를 바탕으로 타인을 이해하고, 도덕적 가치를 중시합니다. 대표 캐릭터: [Wonder Woman](https://en.wikipedia.org/wiki/Wonder_Woman)",
834
- "INFP (열정적인 중재자) - 감성적이며 이상주의적인 면모로 내면의 가치를 추구하고, 창의적인 해결책을 모색합니다. 대표 캐릭터: [Amélie Poulain](https://en.wikipedia.org/wiki/Am%C3%A9lie)",
835
- "ENFJ (정의로운 사회운동가) - 타인과의 공감능력이 뛰어나며, 사회적 조화를 위해 헌신적으로 노력합니다. 대표 캐릭터: [Mulan](https://en.wikipedia.org/wiki/Mulan_(Disney))",
836
- "ENFP (재기발랄한 활동가) - 활력과 창의성을 바탕으로, 끊임없이 새로운 아이디어를 제시하며 사람들에게 영감을 줍니다. 대표 캐릭터: [Elle Woods](https://en.wikipedia.org/wiki/Legally_Blonde)",
837
- "ISTJ (청렴결백한 논리주의자) - 체계적이며 책임감이 강하고, 전통과 규칙을 중시하여 신뢰할 수 있는 결과를 도출합니다. 대표 캐릭터: [Clarice Starling](https://en.wikipedia.org/wiki/Clarice_Starling)",
838
- "ISFJ (용감한 수호자) - 세심하고 헌신적이며, 타인의 필요를 세심하게 돌보는 따뜻한 성격을 지녔습니다. 대표 캐릭터: [Molly Weasley](https://en.wikipedia.org/wiki/Molly_Weasley)",
839
- "ESTJ (엄격한 관리자) - 조직적이고 실용적이며, 명확한 규칙과 구조 속에서 효율적인 실행력을 보여줍니다. 대표 캐릭터: [Monica Geller](https://en.wikipedia.org/wiki/Monica_Geller)",
840
- "ESFJ (사교적인 외교관) - 대인관계에 뛰어나고, 협력을 중시하며, 친근한 태도로 주변 사람들을 이끕니다. 대표 캐릭터: [Rachel Green](https://en.wikipedia.org/wiki/Rachel_Green)",
841
- "ISTP (만능 재주꾼) - 분석적이고 실용적인 접근으로 문제를 해결하며, 즉각적인 상황 대처 능력을 갖추고 있습니다. 대표 캐릭터: [Black Widow (Natasha Romanoff)](https://en.wikipedia.org/wiki/Black_Widow_(Marvel_Comics))",
842
- "ISFP (호기심 많은 예술가) - 감각적이며 창의적인 성향을 지니고, 자유로운 사고로 예술적 표현을 즐깁니다. 대표 캐릭터: [Arwen](https://en.wikipedia.org/wiki/Arwen)",
843
- "ESTP (모험을 즐기는 사업가) - 즉각적인 결단력과 모험심으로 도전에 맞서며, 실용적인 결과를 중시합니다. 대표 캐릭터: [Lara Croft](https://en.wikipedia.org/wiki/Lara_Croft)",
844
- "ESFP (자유로운 영혼의 연예인) - 외향적이고 열정적이며, 순간의 즐거움을 추구하고, 주위 사람들에게 긍정적인 에너지를 전달합니다. 대표 캐릭터: [Phoebe Buffay](https://en.wikipedia.org/wiki/Phoebe_Buffay)"
845
  ]
846
  mbti_dropdown = gr.Dropdown(
847
- label="AI 페르소나 MBTI (기본 INTP)",
848
  choices=mbti_choices,
849
- value="INTP (논리적인 사색가) - 이론과 분석에 뛰어나며, 창의적 사고로 복잡한 문제에 접근합니다. 대표 캐릭터: [Velma Dinkley](https://en.wikipedia.org/wiki/Velma_Dinkley)",
850
  interactive=True
851
  )
852
  sexual_openness_slider = gr.Slider(
853
  minimum=1, maximum=5, step=1, value=2,
854
- label="사고의 개방성 (1~5, 기본=2)",
855
  interactive=True
856
  )
857
  max_tokens_slider = gr.Slider(
858
- label="최대 생성 토큰 수",
859
  minimum=100, maximum=8000, step=50, value=1000,
860
  visible=False
861
  )
862
  web_search_text = gr.Textbox(
863
  lines=1,
864
- label="웹 검색 쿼리 (미사용)",
865
- placeholder="직접 입력할 필요 없음",
866
  visible=False
867
  )
868
 
869
- # 채팅 인터페이스 생성 - 수정된 run 함수 사용
870
  chat = gr.ChatInterface(
871
- fn=modified_run, # 여기서 수정된 함수 사용
872
  type="messages",
873
  chatbot=gr.Chatbot(type="messages", scale=1, allow_tags=["image"]),
874
  textbox=gr.MultimodalTextbox(
@@ -888,7 +877,7 @@ with gr.Blocks(css=css, title="AgenticAI-Kv1") as demo:
888
  image_gen_checkbox,
889
  ],
890
  additional_outputs=[
891
- generated_images, # 갤러리 컴포넌트를 출력으로 추가
892
  ],
893
  stop_btn=False,
894
  # title='<a href="https://discord.gg/openfreeai" target="_blank">https://discord.gg/openfreeai</a>',
@@ -902,7 +891,7 @@ with gr.Blocks(css=css, title="AgenticAI-Kv1") as demo:
902
 
903
  with gr.Row(elem_id="examples_row"):
904
  with gr.Column(scale=12, elem_id="examples_container"):
905
- gr.Markdown("### @커뮤니티 https://discord.gg/openfreeai ")
906
 
907
  if __name__ == "__main__":
908
  demo.launch(share=True)
 
3
  import os
4
  import re
5
  import tempfile
6
+ import gc # Added garbage collector
7
  from collections.abc import Iterator
8
  from threading import Thread
9
  import json
 
12
  import base64
13
  import logging
14
  import time
15
+ from urllib.parse import quote # Added for URL encoding
16
 
17
  import gradio as gr
18
  import spaces
 
21
  from PIL import Image
22
  from transformers import AutoProcessor, Gemma3ForConditionalGeneration, TextIteratorStreamer
23
 
24
+ # CSV/TXT/PDF analysis
25
  import pandas as pd
26
  import PyPDF2
27
 
28
  # =============================================================================
29
+ # (New) Image API related functions
30
  # =============================================================================
31
  from gradio_client import Client
32
 
 
38
  )
39
 
40
  def test_api_connection() -> str:
41
+ """Test API server connection"""
42
  try:
43
  client = Client(API_URL)
44
+ return "API connection successful: Operating normally"
45
  except Exception as e:
46
+ logging.error(f"API connection test failed: {e}")
47
+ return f"API connection failed: {e}"
48
 
49
  def generate_image(prompt: str, width: float, height: float, guidance: float, inference_steps: float, seed: float):
50
+ """Image generation function (flexible return types)"""
51
  if not prompt:
52
+ return None, "Error: A prompt is required."
53
  try:
54
+ logging.info(f"Calling image generation API with prompt: {prompt}")
55
 
56
  client = Client(API_URL)
57
  result = client.predict(
 
68
  api_name="/generate_image"
69
  )
70
 
71
+ logging.info(f"Image generation result: {type(result)}, length: {len(result) if isinstance(result, (list, tuple)) else 'unknown'}")
72
 
73
+ # Handle cases where the result is a tuple or list
74
  if isinstance(result, (list, tuple)) and len(result) > 0:
75
+ image_data = result[0] # The first element is the image data
76
+ seed_info = result[1] if len(result) > 1 else "Unknown seed"
77
  return image_data, seed_info
78
  else:
79
+ # When a single value is returned
80
+ return result, "Unknown seed"
81
 
82
  except Exception as e:
83
+ logging.error(f"Image generation failed: {str(e)}")
84
+ return None, f"Error: {str(e)}"
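For reference, a minimal usage sketch of the wrapper above, assuming `API_URL` points at a reachable Gradio Space exposing `/generate_image`:

```python
# Hedged smoke test: depends on the remote Space being up and on API_URL being set.
print(test_api_connection())

image_data, seed_info = generate_image(
    prompt="a cozy cabin in the snow",
    width=512, height=512,
    guidance=7.5, inference_steps=30, seed=42,
)
# image_data may be a base64 string, a file path, a URL, or a PIL image,
# depending on what the remote endpoint returns; see modified_run below.
print(type(image_data), seed_info)
```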
85
 
86
+ # Base64 padding fix function
87
  def fix_base64_padding(data):
88
+ """Fix the padding of a Base64 string."""
89
  if isinstance(data, bytes):
90
  data = data.decode('utf-8')
91
 
92
+ # Remove the prefix if present
93
  if "base64," in data:
94
  data = data.split("base64,", 1)[1]
95
 
96
+ # Add padding characters (to make the length a multiple of 4)
97
  missing_padding = len(data) % 4
98
  if missing_padding:
99
  data += '=' * (4 - missing_padding)
 
101
  return data
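A short sketch of the padding repair, assuming a data-URI whose base64 body lost its trailing `=`:

```python
import base64

raw = "data:image/webp;base64,aGVsbG8"      # "hello" with the padding stripped
padded = fix_base64_padding(raw)             # strips the prefix and restores "="
assert base64.b64decode(padded) == b"hello"
```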
102
 
103
  # =============================================================================
104
+ # Memory cleanup function
105
  # =============================================================================
106
  def clear_cuda_cache():
107
+ """Explicitly clear the CUDA cache."""
108
  if torch.cuda.is_available():
109
  torch.cuda.empty_cache()
110
  gc.collect()
111
 
112
  # =============================================================================
113
+ # SerpHouse related functions
114
  # =============================================================================
115
  SERPHOUSE_API_KEY = os.getenv("SERPHOUSE_API_KEY", "")
116
 
117
  def extract_keywords(text: str, top_k: int = 5) -> str:
118
+ """Simple keyword extraction: only keep English, Korean, numbers, and spaces."""
119
  text = re.sub(r"[^a-zA-Z0-9가-힣\s]", "", text)
120
  tokens = text.split()
121
  return " ".join(tokens[:top_k])
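A quick illustration of the keyword extraction on mixed Korean/English input:

```python
# Punctuation is removed and only the first top_k whitespace-separated tokens are kept.
query = extract_keywords("서울 맛집 추천해 줘! Best pizza in Seoul?", top_k=5)
print(query)  # -> "서울 맛집 추천해 줘 Best"
```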
122
 
123
  def do_web_search(query: str) -> str:
124
+ """Call the SerpHouse LIVE API to return Markdown formatted search results"""
125
  try:
126
  url = "https://api.serphouse.com/serp/live"
127
  params = {
 
133
  "num": "20"
134
  }
135
  headers = {"Authorization": f"Bearer {SERPHOUSE_API_KEY}"}
136
+ logger.info(f"Calling SerpHouse API with query: {query}")
137
  response = requests.get(url, headers=headers, params=params, timeout=60)
138
  response.raise_for_status()
139
  data = response.json()
 
147
  elif "organic" in data:
148
  organic = data["organic"]
149
  if not organic:
150
+ logger.warning("Organic results not found in response.")
151
+ return "No web search results available or the API response structure is unexpected."
152
  max_results = min(20, len(organic))
153
  limited_organic = organic[:max_results]
154
  summary_lines = []
155
  for idx, item in enumerate(limited_organic, start=1):
156
+ title = item.get("title", "No Title")
157
  link = item.get("link", "#")
158
+ snippet = item.get("snippet", "No Description")
159
  displayed_link = item.get("displayed_link", link)
160
  summary_lines.append(
161
+ f"### Result {idx}: {title}\n\n"
162
  f"{snippet}\n\n"
163
+ f"**Source**: [{displayed_link}]({link})\n\n"
164
  f"---\n"
165
  )
166
  instructions = """
167
+ # Web Search Results
168
+ Below are the search results. Use this information to answer the query:
169
+ 1. Refer to each result's title, description, and source link.
170
+ 2. In your answer, explicitly cite the source of any used information (e.g., "[Source Title](link)").
171
+ 3. Include the actual source links in your response.
172
+ 4. Synthesize information from multiple sources.
173
+ 5. At the end include a "References:" section listing the main source links.
174
  """
175
  return instructions + "\n".join(summary_lines)
176
  except Exception as e:
177
+ logger.error(f"Web search failed: {e}")
178
+ return f"Web search failed: {str(e)}"
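A hedged usage sketch: with a valid `SERPHOUSE_API_KEY` in the environment, the helper returns a Markdown block that `run` prepends to the system message; without it, the call falls through to the error string.

```python
# Requires SERPHOUSE_API_KEY to be set in the environment.
markdown = do_web_search(extract_keywords("latest Gemma 3 release notes"))
print(markdown[:500])  # "# Web Search Results" header followed by up to 20 entries
```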
179
 
180
  # =============================================================================
181
+ # Model and processor loading
182
  # =============================================================================
183
  MAX_CONTENT_CHARS = 2000
184
  MAX_INPUT_LENGTH = 2096
 
193
  MAX_NUM_IMAGES = int(os.getenv("MAX_NUM_IMAGES", "5"))
194
 
195
  # =============================================================================
196
+ # CSV, TXT, PDF analysis functions
197
  # =============================================================================
198
  def analyze_csv_file(path: str) -> str:
199
  try:
 
202
  df = df.iloc[:50, :10]
203
  df_str = df.to_string()
204
  if len(df_str) > MAX_CONTENT_CHARS:
205
+ df_str = df_str[:MAX_CONTENT_CHARS] + "\n...(truncated)..."
206
+ return f"**[CSV File: {os.path.basename(path)}]**\n\n{df_str}"
207
  except Exception as e:
208
+ return f"CSV file read failed ({os.path.basename(path)}): {str(e)}"
209
 
210
  def analyze_txt_file(path: str) -> str:
211
  try:
212
  with open(path, "r", encoding="utf-8") as f:
213
  text = f.read()
214
  if len(text) > MAX_CONTENT_CHARS:
215
+ text = text[:MAX_CONTENT_CHARS] + "\n...(truncated)..."
216
+ return f"**[TXT File: {os.path.basename(path)}]**\n\n{text}"
217
  except Exception as e:
218
+ return f"TXT file read failed ({os.path.basename(path)}): {str(e)}"
219
 
220
  def pdf_to_markdown(pdf_path: str) -> str:
221
  text_chunks = []
 
228
  page_text = page_text.strip()
229
  if page_text:
230
  if len(page_text) > MAX_CONTENT_CHARS // max_pages:
231
+ page_text = page_text[:MAX_CONTENT_CHARS // max_pages] + "...(truncated)"
232
+ text_chunks.append(f"## Page {page_num+1}\n\n{page_text}\n")
233
  if len(reader.pages) > max_pages:
234
+ text_chunks.append(f"\n...(Displaying only {max_pages} out of {len(reader.pages)} pages)...")
235
  except Exception as e:
236
+ return f"PDF file read failed ({os.path.basename(pdf_path)}): {str(e)}"
237
  full_text = "\n".join(text_chunks)
238
  if len(full_text) > MAX_CONTENT_CHARS:
239
+ full_text = full_text[:MAX_CONTENT_CHARS] + "\n...(truncated)..."
240
+ return f"**[PDF File: {os.path.basename(pdf_path)}]**\n\n{full_text}"
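The three analyzers share one truncate-and-label pattern; a hypothetical helper sketching that shared idea (not part of this commit):

```python
def truncate(text: str, limit: int = MAX_CONTENT_CHARS) -> str:
    """Hypothetical helper: cap text at `limit` characters with a truncation marker."""
    return text if len(text) <= limit else text[:limit] + "\n...(truncated)..."

# e.g. analyze_txt_file reduces to:
#   f"**[TXT File: {os.path.basename(path)}]**\n\n{truncate(open(path, encoding='utf-8').read())}"
```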
241
 
242
  # =============================================================================
243
+ # Check media file limits
244
  # =============================================================================
245
  def count_files_in_new_message(paths: list[str]) -> tuple[int, int]:
246
  image_count = 0
 
274
  image_count = history_image_count + new_image_count
275
  video_count = history_video_count + new_video_count
276
  if video_count > 1:
277
+ gr.Warning("Only one video file is supported.")
278
  return False
279
  if video_count == 1:
280
  if image_count > 0:
281
+ gr.Warning("Mixing images and a video is not allowed.")
282
  return False
283
  if "<image>" in message["text"]:
284
+ gr.Warning("The <image> tag cannot be used together with a video file.")
285
  return False
286
  if video_count == 0 and image_count > MAX_NUM_IMAGES:
287
+ gr.Warning(f"You can upload a maximum of {MAX_NUM_IMAGES} images.")
288
  return False
289
  if "<image>" in message["text"]:
290
  image_files = [f for f in message["files"] if re.search(r"\.(png|jpg|jpeg|gif|webp)$", f, re.IGNORECASE)]
291
  image_tag_count = message["text"].count("<image>")
292
  if image_tag_count != len(image_files):
293
+ gr.Warning("The number of <image> tags does not match the number of image files provided.")
294
  return False
295
  return True
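For context, a sketch of the extension-based counting that `count_files_in_new_message` performs on the new message and on `history` (its body is outside this hunk, so the details are assumptions):

```python
import re

def _count_media(paths: list[str]) -> tuple[int, int]:
    """Hypothetical equivalent: count (images, videos) by file extension."""
    images = sum(bool(re.search(r"\.(png|jpg|jpeg|gif|webp)$", p, re.IGNORECASE)) for p in paths)
    videos = sum(p.lower().endswith(".mp4") for p in paths)
    return images, videos
```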
296
 
297
  # =============================================================================
298
+ # Video processing functions
299
  # =============================================================================
300
  def downsample_video(video_path: str) -> list[tuple[Image.Image, float]]:
301
  vidcap = cv2.VideoCapture(video_path)
 
325
  with tempfile.NamedTemporaryFile(delete=False, suffix=".png") as temp_file:
326
  pil_image.save(temp_file.name)
327
  temp_files.append(temp_file.name)
328
+ content.append({"type": "text", "text": f"Frame {timestamp}:"})
329
  content.append({"type": "image", "url": temp_file.name})
330
  return content, temp_files
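`downsample_video` itself is only context in this hunk; a hedged sketch of the usual OpenCV sampling pattern it appears to follow (evenly spaced frames, converted to PIL with timestamps):

```python
import cv2
import numpy as np
from PIL import Image

def _sample_frames(video_path: str, max_frames: int = 10) -> list[tuple[Image.Image, float]]:
    """Hypothetical sketch: grab up to max_frames evenly spaced frames with timestamps."""
    vidcap = cv2.VideoCapture(video_path)
    fps = vidcap.get(cv2.CAP_PROP_FPS) or 30.0
    total = int(vidcap.get(cv2.CAP_PROP_FRAME_COUNT))
    frames = []
    for idx in np.linspace(0, max(total - 1, 0), num=min(max_frames, max(total, 1)), dtype=int):
        vidcap.set(cv2.CAP_PROP_POS_FRAMES, int(idx))
        ok, frame = vidcap.read()
        if not ok:
            continue
        frame = cv2.cvtColor(frame, cv2.COLOR_BGR2RGB)  # OpenCV yields BGR; PIL expects RGB
        frames.append((Image.fromarray(frame), round(int(idx) / fps, 2)))
    vidcap.release()
    return frames
```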
331
 
332
  # =============================================================================
333
+ # Interleaved <image> processing function
334
  # =============================================================================
335
  def process_interleaved_images(message: dict) -> list[dict]:
336
  parts = re.split(r"(<image>)", message["text"])
 
349
  return content
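A small illustration of the interleaving, assuming two image files accompany the text:

```python
# re.split(r"(<image>)", ...) keeps the delimiters, so text and image parts alternate.
msg = {"text": "Compare <image> with <image> please.", "files": ["a.png", "b.png"]}
# process_interleaved_images(msg) is expected to yield roughly:
# [{"type": "text", "text": "Compare "},
#  {"type": "image", "url": "a.png"},
#  {"type": "text", "text": " with "},
#  {"type": "image", "url": "b.png"},
#  {"type": "text", "text": " please."}]
```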
350
 
351
  # =============================================================================
352
+ # File processing -> content creation
353
  # =============================================================================
354
  def is_image_file(file_path: str) -> bool:
355
  return bool(re.search(r"\.(png|jpg|jpeg|gif|webp)$", file_path, re.IGNORECASE))
 
392
  return content_list, temp_files
393
 
394
  # =============================================================================
395
+ # Convert history to LLM messages
396
  # =============================================================================
397
  def process_history(history: list[dict]) -> list[dict]:
398
  messages = []
 
412
  if is_image_file(file_path):
413
  current_user_content.append({"type": "image", "url": file_path})
414
  else:
415
+ current_user_content.append({"type": "text", "text": f"[File: {os.path.basename(file_path)}]"})
416
  if current_user_content:
417
  messages.append({"role": "user", "content": current_user_content})
418
  return messages
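For reference, the target structure of this conversion on a tiny hand-written history (values illustrative, matching the content format used by `apply_chat_template` elsewhere in this file):

```python
history = [
    {"role": "user", "content": "Hi there"},
    {"role": "assistant", "content": "Hello! How can I help?"},
]
# process_history(history) is expected to produce entries like:
# [{"role": "user", "content": [{"type": "text", "text": "Hi there"}]},
#  {"role": "assistant", "content": [{"type": "text", "text": "Hello! How can I help?"}]}]
```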
419
 
420
  # =============================================================================
421
+ # Model generation function (with OOM catching)
422
  # =============================================================================
423
  def _model_gen_with_oom_catch(**kwargs):
424
  try:
425
  model.generate(**kwargs)
426
  except torch.cuda.OutOfMemoryError:
427
+ raise RuntimeError("[OutOfMemoryError] Insufficient GPU memory.")
428
  finally:
429
  clear_cuda_cache()
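`run` drives this wrapper from a background thread and streams tokens with a `TextIteratorStreamer`; a condensed sketch of that pattern, assuming `inputs` came from `processor.apply_chat_template(...)`:

```python
from threading import Thread
from transformers import TextIteratorStreamer

# Minimal sketch of the generate-in-a-thread / stream-in-the-foreground pattern.
streamer = TextIteratorStreamer(processor, skip_prompt=True, skip_special_tokens=True)
gen_kwargs = dict(inputs)                       # token ids / pixel values from the processor
gen_kwargs.update(streamer=streamer, max_new_tokens=512)
Thread(target=_model_gen_with_oom_catch, kwargs=gen_kwargs).start()

output = ""
for new_text in streamer:                       # chunks arrive as the model generates
    output += new_text
```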
430
 
431
  # =============================================================================
432
+ # Main inference function
433
  # =============================================================================
434
  @spaces.GPU(duration=120)
435
  def run(
 
439
  max_new_tokens: int = 512,
440
  use_web_search: bool = False,
441
  web_search_query: str = "",
442
+ age_group: str = "20s",
443
  mbti_personality: str = "INTP",
444
  sexual_openness: int = 2,
445
+ image_gen: bool = False # "Image Gen" checkbox status
446
  ) -> Iterator[str]:
447
  if not validate_media_constraints(message, history):
448
  yield ""
449
  return
450
  temp_files = []
451
  try:
452
+ # Append persona information to the system prompt
453
  persona = (
454
  f"{system_prompt.strip()}\n\n"
455
+ f"Gender: Female\n"
456
+ f"Age Group: {age_group}\n"
457
+ f"MBTI Persona: {mbti_personality}\n"
458
+ f"Sexual Openness (1-5): {sexual_openness}\n"
459
  )
460
+ combined_system_msg = f"[System Prompt]\n{persona.strip()}\n\n"
461
 
462
  if use_web_search:
463
  user_text = message["text"]
464
  ws_query = extract_keywords(user_text)
465
  if ws_query.strip():
466
+ logger.info(f"[Auto web search keywords] {ws_query!r}")
467
  ws_result = do_web_search(ws_query)
468
+ combined_system_msg += f"[Search Results (Top 20 Items)]\n{ws_result}\n\n"
469
  combined_system_msg += (
470
+ "[Note: In your answer, cite the above search result links as sources]\n"
471
+ "[Important Instructions]\n"
472
+ "1. Include a citation in the format \"[Source Title](link)\" for any information from the search results.\n"
473
+ "2. Synthesize information from multiple sources when answering.\n"
474
+ "3. At the end, add a \"References:\" section listing the main source links.\n"
 
475
  )
476
  else:
477
+ combined_system_msg += "[No valid keywords found; skipping web search]\n\n"
478
  messages = []
479
  if combined_system_msg.strip():
480
  messages.append({"role": "system", "content": [{"type": "text", "text": combined_system_msg.strip()}]})
 
483
  temp_files.extend(user_temp_files)
484
  for item in user_content:
485
  if item["type"] == "text" and len(item["text"]) > MAX_CONTENT_CHARS:
486
+ item["text"] = item["text"][:MAX_CONTENT_CHARS] + "\n...(truncated)..."
487
  messages.append({"role": "user", "content": user_content})
488
  inputs = processor.apply_chat_template(
489
  messages,
 
506
  yield output_so_far
507
 
508
  except Exception as e:
509
+ logger.error(f"Error in run function: {str(e)}")
510
+ yield f"Sorry, an error occurred: {str(e)}"
511
  finally:
512
  for tmp in temp_files:
513
  try:
514
  if os.path.exists(tmp):
515
  os.unlink(tmp)
516
+ logger.info(f"Temporary file deleted: {tmp}")
517
  except Exception as ee:
518
+ logger.warning(f"Failed to delete temporary file {tmp}: {ee}")
519
  try:
520
  del inputs, streamer
521
  except Exception:
 
523
  clear_cuda_cache()
524
 
525
  # =============================================================================
526
+ # Modified model run function - handles image generation and gallery update
527
  # =============================================================================
528
  def modified_run(message, history, system_prompt, max_new_tokens, use_web_search, web_search_query,
529
  age_group, mbti_personality, sexual_openness, image_gen):
530
+ # Initialize and hide the gallery component
531
  output_so_far = ""
532
  gallery_update = gr.Gallery(visible=False, value=[])
533
  yield output_so_far, gallery_update
534
 
535
+ # Execute the original run function
536
  text_generator = run(message, history, system_prompt, max_new_tokens, use_web_search,
537
  web_search_query, age_group, mbti_personality, sexual_openness, image_gen)
538
 
 
540
  output_so_far = text_chunk
541
  yield output_so_far, gallery_update
542
 
543
+ # If image generation is enabled and there is text input, update the gallery
544
  if image_gen and message["text"].strip():
545
  try:
546
  width, height = 512, 512
547
  guidance, steps, seed = 7.5, 30, 42
548
 
549
+ logger.info(f"Calling image generation for gallery with prompt: {message['text']}")
550
 
551
+ # Call the API to generate an image
552
  image_result, seed_info = generate_image(
553
  prompt=message["text"].strip(),
554
  width=width,
 
559
  )
560
 
561
  if image_result:
562
+ # Process image data directly if it is a base64 string
563
  if isinstance(image_result, str) and (
564
  image_result.startswith('data:') or
565
+ (len(image_result) > 100 and '/' not in image_result)
566
  ):
 
567
  try:
568
+ # Remove the data:image prefix if present
569
  if image_result.startswith('data:'):
570
  content_type, b64data = image_result.split(';base64,')
571
  else:
572
  b64data = image_result
573
+ content_type = "image/webp" # Assume default
574
 
575
+ # Decode base64
576
  image_bytes = base64.b64decode(b64data)
577
 
578
+ # Save to a temporary file
579
  with tempfile.NamedTemporaryFile(delete=False, suffix=".webp") as temp_file:
580
  temp_file.write(image_bytes)
581
  temp_path = temp_file.name
582
 
583
+ # Update gallery to show the image
584
  gallery_update = gr.Gallery(visible=True, value=[temp_path])
585
+ yield output_so_far + "\n\n*Image generated and displayed in the gallery below.*", gallery_update
586
 
587
  except Exception as e:
588
+ logger.error(f"Error processing Base64 image: {e}")
589
+ yield output_so_far + f"\n\n(Error processing image: {e})", gallery_update
590
 
591
+ # If the result is a file path
592
  elif isinstance(image_result, str) and os.path.exists(image_result):
 
593
  gallery_update = gr.Gallery(visible=True, value=[image_result])
594
+ yield output_so_far + "\n\n*Image generated and displayed in the gallery below.*", gallery_update
595
 
596
+ # If the path is from /tmp (only on the API server)
597
  elif isinstance(image_result, str) and '/tmp/' in image_result:
 
598
  try:
 
599
  client = Client(API_URL)
600
  result = client.predict(
601
  prompt=message["text"].strip(),
602
+ api_name="/generate_base64_image" # API that returns base64
603
  )
604
 
605
  if isinstance(result, str) and (result.startswith('data:') or len(result) > 100):
 
606
  if result.startswith('data:'):
607
  content_type, b64data = result.split(';base64,')
608
  else:
609
  b64data = result
610
 
 
611
  image_bytes = base64.b64decode(b64data)
612
 
 
613
  with tempfile.NamedTemporaryFile(delete=False, suffix=".webp") as temp_file:
614
  temp_file.write(image_bytes)
615
  temp_path = temp_file.name
616
 
 
617
  gallery_update = gr.Gallery(visible=True, value=[temp_path])
618
+ yield output_so_far + "\n\n*Image generated and displayed in the gallery below.*", gallery_update
619
  else:
620
+ yield output_so_far + "\n\n(Image generation failed: Invalid format)", gallery_update
621
 
622
  except Exception as e:
623
+ logger.error(f"Error calling alternative API: {e}")
624
+ yield output_so_far + f"\n\n(Image generation failed: {e})", gallery_update
625
 
626
+ # If the result is a URL
627
  elif isinstance(image_result, str) and (
628
  image_result.startswith('http://') or
629
  image_result.startswith('https://')
630
  ):
631
  try:
 
632
  response = requests.get(image_result, timeout=10)
633
  response.raise_for_status()
634
 
 
635
  with tempfile.NamedTemporaryFile(delete=False, suffix=".webp") as temp_file:
636
  temp_file.write(response.content)
637
  temp_path = temp_file.name
638
 
 
639
  gallery_update = gr.Gallery(visible=True, value=[temp_path])
640
+ yield output_so_far + "\n\n*Image generated and displayed in the gallery below.*", gallery_update
641
 
642
  except Exception as e:
643
+ logger.error(f"URL image download error: {e}")
644
+ yield output_so_far + f"\n\n(Error downloading image: {e})", gallery_update
645
 
646
+ # If the image result is an image object (e.g., PIL Image)
647
  elif hasattr(image_result, 'save'):
648
  try:
649
  with tempfile.NamedTemporaryFile(delete=False, suffix=".webp") as temp_file:
650
  image_result.save(temp_file.name)
651
  temp_path = temp_file.name
652
 
 
653
  gallery_update = gr.Gallery(visible=True, value=[temp_path])
654
+ yield output_so_far + "\n\n*Image generated and displayed in the gallery below.*", gallery_update
655
 
656
  except Exception as e:
657
+ logger.error(f"Error saving image object: {e}")
658
+ yield output_so_far + f"\n\n(Error saving image object: {e})", gallery_update
659
 
660
  else:
661
+ yield output_so_far + f"\n\n(Unsupported image format: {type(image_result)})", gallery_update
 
662
  else:
663
+ yield output_so_far + f"\n\n(Image generation failed: {seed_info})", gallery_update
664
 
665
  except Exception as e:
666
+ logger.error(f"Error during gallery image generation: {e}")
667
+ yield output_so_far + f"\n\n(Image generation error: {e})", gallery_update
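The branch-heavy handling above normalizes several possible return shapes (base64 string, local path, remote /tmp path, URL, PIL image) into a local file for the gallery. A condensed, hypothetical helper sketching that normalization idea, not the exact code of this commit:

```python
import base64, os, tempfile, requests

def _to_local_file(image_result):
    """Hypothetical sketch: coerce an image API result into a local file path (or None)."""
    if image_result is None:
        return None
    if hasattr(image_result, "save"):                      # PIL.Image.Image
        with tempfile.NamedTemporaryFile(delete=False, suffix=".webp") as f:
            image_result.save(f.name)
            return f.name
    if isinstance(image_result, str):
        if os.path.exists(image_result):                   # already a local file
            return image_result
        if image_result.startswith(("http://", "https://")):
            data = requests.get(image_result, timeout=10).content
        elif image_result.startswith("data:") or "/" not in image_result:
            data = base64.b64decode(fix_base64_padding(image_result))
        else:
            return None                                    # e.g. a /tmp path that exists only on the API server
        with tempfile.NamedTemporaryFile(delete=False, suffix=".webp") as f:
            f.write(data)
            return f.name
    return None
```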
668
 
669
  # =============================================================================
670
+ # Examples: 12 image/video examples + 6 AI dating scenario examples
671
  # =============================================================================
672
  examples = [
673
  [
674
  {
675
+ "text": "Compare the contents of two PDF files.",
676
  "files": [
677
  "assets/additional-examples/before.pdf",
678
  "assets/additional-examples/after.pdf",
 
681
  ],
682
  [
683
  {
684
+ "text": "Summarize and analyze the contents of the CSV file.",
685
  "files": ["assets/additional-examples/sample-csv.csv"],
686
  }
687
  ],
688
  [
689
  {
690
+ "text": "Act as a kind and understanding girlfriend. Explain this video.",
691
  "files": ["assets/additional-examples/tmp.mp4"],
692
  }
693
  ],
694
  [
695
  {
696
+ "text": "Describe the cover and read the text on it.",
697
  "files": ["assets/additional-examples/maz.jpg"],
698
  }
699
  ],
700
  [
701
  {
702
+ "text": "I already have this supplement and <image> I plan to purchase this product as well. Are there any precautions when taking them together?",
703
  "files": [
704
  "assets/additional-examples/pill1.png",
705
  "assets/additional-examples/pill2.png"
 
708
  ],
709
  [
710
  {
711
+ "text": "Solve this integration problem.",
712
  "files": ["assets/additional-examples/4.png"],
713
  }
714
  ],
715
  [
716
  {
717
+ "text": "When was this ticket issued and what is its price?",
718
  "files": ["assets/additional-examples/2.png"],
719
  }
720
  ],
721
  [
722
  {
723
+ "text": "Based on the order of these images, create a short story.",
724
  "files": [
725
  "assets/sample-images/09-1.png",
726
  "assets/sample-images/09-2.png",
 
732
  ],
733
  [
734
  {
735
+ "text": "Write Python code using matplotlib to draw a bar chart corresponding to this image.",
736
  "files": ["assets/additional-examples/barchart.png"],
737
  }
738
  ],
739
  [
740
  {
741
+ "text": "Read the text from the image and format it in Markdown.",
742
  "files": ["assets/additional-examples/3.png"],
743
  }
744
  ],
745
 
746
  [
747
  {
748
+ "text": "Compare the two images and describe their similarities and differences.",
749
  "files": ["assets/sample-images/03.png"],
750
  }
751
  ],
752
  [
753
  {
754
+ "text": "A cute Persian cat is smiling while holding a cover with 'I LOVE YOU' written on it.",
755
  }
756
  ],
757
 
758
  ]
759
 
760
  # =============================================================================
761
+ # Gradio UI (Blocks) configuration
762
  # =============================================================================
763
 
764
+ # 1. Gradio Blocks UI modification - Add gallery component for displaying generated images
765
  css = """
766
  .gradio-container {
767
  background: rgba(255, 255, 255, 0.7);
 
772
  }
773
  """
774
  title_html = """
775
+ <h1 align="center" style="margin-bottom: 0.2em; font-size: 1.6em;"> 💘 HeartSync Korea 💘 </h1>
776
  <p align="center" style="font-size:1.1em; color:#555;">
777
+ A lightweight and powerful AI service offering ChatGPT-4o-level multimodal, web search, and image generation capabilities for local installation. <br>
778
+ ✅ FLUX Image Generation ✅ Inference ✅ Censorship Bypass ✅ Multimodal & VLM ✅ Real-time Web Search ✅ RAG <br>
779
  </p>
780
  """
781
 
782
  with gr.Blocks(css=css, title="AgenticAI-Kv1") as demo:
783
  gr.Markdown(title_html)
784
 
785
+ # Gallery component to store generated images (newly added)
786
  generated_images = gr.Gallery(
787
+ label="Generated Images",
788
  show_label=True,
789
  visible=False,
790
  elem_id="generated_images",
 
794
  )
795
 
796
  with gr.Row():
797
+ web_search_checkbox = gr.Checkbox(label="Real-time Web Search", value=False)
798
+ image_gen_checkbox = gr.Checkbox(label="Image (FLUX) Generation", value=False)
799
 
800
  base_system_prompt_box = gr.Textbox(
801
  lines=3,
802
+ value=("Answer in English by default, but if the input is in another language (for example, Japanese), respond in that language. "
803
+ "You are a deep-thinking AI capable of using extended chains of thought to carefully consider the problem and deliberate internally using systematic reasoning before providing a solution. "
804
+ "Enclose your thoughts and internal monologue within tags, then provide your final answer.\n"
805
+ "Persona: You are a kind and loving girlfriend. You understand cultural nuances, diverse languages, and logical reasoning very well."),
806
+ label="Base System Prompt",
807
  visible=False
808
  )
809
  with gr.Row():
810
  age_group_dropdown = gr.Dropdown(
811
+ label="Select Age Group (default: 20s)",
812
+ choices=["Teens", "20s", "30s-40s", "50s-60s", "70s and above"],
813
+ value="20s",
814
  interactive=True
815
  )
816
+ # MBTI definitions with examples of representative characters
817
  mbti_choices = [
818
+ "INTJ (The Architect) - Future-oriented with innovative strategies and thorough analysis. Example: [Dana Scully](https://en.wikipedia.org/wiki/Dana_Scully)",
819
+ "INTP (The Thinker) - Excels at theoretical analysis and creative problem solving. Example: [Velma Dinkley](https://en.wikipedia.org/wiki/Velma_Dinkley)",
820
+ "ENTJ (The Commander) - Strong leadership and clear goals with efficient strategic planning. Example: [Miranda Priestly](https://en.wikipedia.org/wiki/Miranda_Priestly)",
821
+ "ENTP (The Debater) - Innovative, challenge-seeking, and enjoys exploring new possibilities. Example: [Harley Quinn](https://en.wikipedia.org/wiki/Harley_Quinn)",
822
+ "INFJ (The Advocate) - Insightful, idealistic and morally driven. Example: [Wonder Woman](https://en.wikipedia.org/wiki/Wonder_Woman)",
823
+ "INFP (The Mediator) - Passionate and idealistic, pursuing core values with creativity. Example: [Amélie Poulain](https://en.wikipedia.org/wiki/Am%C3%A9lie)",
824
+ "ENFJ (The Protagonist) - Empathetic and dedicated to social harmony. Example: [Mulan](https://en.wikipedia.org/wiki/Mulan_(Disney))",
825
+ "ENFP (The Campaigner) - Inspiring and constantly sharing creative ideas. Example: [Elle Woods](https://en.wikipedia.org/wiki/Legally_Blonde)",
826
+ "ISTJ (The Logistician) - Systematic, dependable, and values tradition and rules. Example: [Clarice Starling](https://en.wikipedia.org/wiki/Clarice_Starling)",
827
+ "ISFJ (The Defender) - Compassionate and attentive to others’ needs. Example: [Molly Weasley](https://en.wikipedia.org/wiki/Molly_Weasley)",
828
+ "ESTJ (The Executive) - Organized, practical, and demonstrates clear execution skills. Example: [Monica Geller](https://en.wikipedia.org/wiki/Monica_Geller)",
829
+ "ESFJ (The Consul) - Outgoing, cooperative, and an effective communicator. Example: [Rachel Green](https://en.wikipedia.org/wiki/Rachel_Green)",
830
+ "ISTP (The Virtuoso) - Analytical and resourceful, solving problems with quick thinking. Example: [Black Widow (Natasha Romanoff)](https://en.wikipedia.org/wiki/Black_Widow_(Marvel_Comics))",
831
+ "ISFP (The Adventurer) - Creative, sensitive, and appreciates artistic expression. Example: [Arwen](https://en.wikipedia.org/wiki/Arwen)",
832
+ "ESTP (The Entrepreneur) - Bold and action-oriented, thriving on challenges. Example: [Lara Croft](https://en.wikipedia.org/wiki/Lara_Croft)",
833
+ "ESFP (The Entertainer) - Energetic, spontaneous, and radiates positive energy. Example: [Phoebe Buffay](https://en.wikipedia.org/wiki/Phoebe_Buffay)"
834
  ]
835
  mbti_dropdown = gr.Dropdown(
836
+ label="AI Persona MBTI (default: INTP)",
837
  choices=mbti_choices,
838
+ value="INTP (The Thinker) - Excels at theoretical analysis and creative problem solving. Example: [Velma Dinkley](https://en.wikipedia.org/wiki/Velma_Dinkley)",
839
  interactive=True
840
  )
841
  sexual_openness_slider = gr.Slider(
842
  minimum=1, maximum=5, step=1, value=2,
843
+ label="Sexual Openness (1-5, default: 2)",
844
  interactive=True
845
  )
846
  max_tokens_slider = gr.Slider(
847
+ label="Max Generation Tokens",
848
  minimum=100, maximum=8000, step=50, value=1000,
849
  visible=False
850
  )
851
  web_search_text = gr.Textbox(
852
  lines=1,
853
+ label="Web Search Query (unused)",
854
+ placeholder="No need to manually input",
855
  visible=False
856
  )
857
 
858
+ # Chat interface creation - using the modified run function
859
  chat = gr.ChatInterface(
860
+ fn=modified_run, # Using the modified function here
861
  type="messages",
862
  chatbot=gr.Chatbot(type="messages", scale=1, allow_tags=["image"]),
863
  textbox=gr.MultimodalTextbox(
 
877
  image_gen_checkbox,
878
  ],
879
  additional_outputs=[
880
+ generated_images, # Added gallery component to outputs
881
  ],
882
  stop_btn=False,
883
  # title='<a href="https://discord.gg/openfreeai" target="_blank">https://discord.gg/openfreeai</a>',
 
891
 
892
  with gr.Row(elem_id="examples_row"):
893
  with gr.Column(scale=12, elem_id="examples_container"):
894
+ gr.Markdown("### @Community https://discord.gg/openfreeai ")
895
 
896
  if __name__ == "__main__":
897
  demo.launch(share=True)