Update app.py
app.py
CHANGED
@@ -15,7 +15,6 @@ intents.messages = True
 # hf_client = InferenceClient("meta-llama/Meta-Llama-3-70B-Instruct", token=os.getenv("HF_TOKEN"))
 hf_client = InferenceClient("CohereForAI/c4ai-command-r-plus", token=os.getenv("HF_TOKEN"))
 
-
 # Variable that stores the conversation history
 conversation_history = []
 
@@ -31,13 +30,14 @@ class MyClient(discord.Client):
         logging.info('Ignoring my own message.')
         return
 
-        logging.debug(f'Receiving message: {message.content}')
+        logging.debug(f'Receiving message: {message.content}')  # Log the incoming message
         response = await generate_response(message.content)
         await message.channel.send(response)
 
 async def generate_response(user_input):
-    system_message = "You are a professional AI assistant that answers users' questions on DISCORD
+    system_message = "You are a professional AI assistant that answers users' questions on DISCORD. Keep the conversation going, and refer to your previous responses."
     system_prefix = """
+
 You must answer in Korean. Use proper spacing in the output and format it as markdown.
 Provide answers suited to the question, and make them as specific and helpful as possible.
 Give all answers in Korean, and remember the conversation history.
@@ -45,25 +45,29 @@ async def generate_response(user_input):
 You must answer in Korean.
 """
 
+
     # Manage the conversation history
     global conversation_history
     conversation_history.append({"role": "user", "content": user_input})
+    logging.debug(f'Conversation history updated: {conversation_history}')  # Log the conversation history
 
     messages = [{"role": "system", "content": f"{system_prefix} {system_message}"}] + conversation_history
+    logging.debug(f'Messages to be sent to the model: {messages}')  # Log the messages sent to the model
 
     # Use a wrapper to run the synchronous function asynchronously; changed to stream=True
     loop = asyncio.get_event_loop()
     response = await loop.run_in_executor(None, lambda: hf_client.chat_completion(
-        messages, max_tokens=
+        messages, max_tokens=1000, stream=True, temperature=0.7, top_p=0.85))
 
     # Added logic to handle the streaming response
     full_response = ""
     for part in response:
-
+        if part.choices and part.choices[0].delta.content:  # Check that a delta exists
+            full_response += part.choices[0].delta.content.strip()
 
     conversation_history.append({"role": "assistant", "content": full_response})
+    logging.debug(f'Model response: {full_response}')  # Log the response
 
     return full_response
 
 # Create and run the Discord bot instance
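
For reference, here is a minimal, self-contained sketch of the streaming pattern this commit lands on: a run_in_executor wrapper around huggingface_hub's blocking chat_completion(stream=True) call, with the content deltas folded into one reply. The stream_reply name and the __main__ harness are illustrative and not part of the commit; the model, token source, and sampling parameters are copied from the diff above.

import asyncio
import os

from huggingface_hub import InferenceClient

# Same model and token source as in the commit.
hf_client = InferenceClient("CohereForAI/c4ai-command-r-plus", token=os.getenv("HF_TOKEN"))

async def stream_reply(messages):
    """Illustrative helper: run the blocking streaming call off the event loop
    and fold the token deltas into a single string."""
    loop = asyncio.get_event_loop()
    # chat_completion(stream=True) blocks while opening the connection and
    # returns a synchronous generator, so the call is dispatched to a thread.
    stream = await loop.run_in_executor(None, lambda: hf_client.chat_completion(
        messages, max_tokens=1000, stream=True, temperature=0.7, top_p=0.85))

    full_response = ""
    for part in stream:
        # Skip chunks that carry no content delta.
        if part.choices and part.choices[0].delta.content:
            # Concatenated as-is: calling .strip() on every chunk, as the
            # commit does, can swallow the spaces between words that land on
            # chunk boundaries.
            full_response += part.choices[0].delta.content
    return full_response

if __name__ == "__main__":
    reply = asyncio.run(stream_reply([{"role": "user", "content": "Hello!"}]))
    print(reply)

Note that only the initial chat_completion call runs in the executor; iterating the generator still happens on the event loop, so each chunk read briefly blocks it. Draining the stream inside the executor as well would make the handler fully non-blocking.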
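
The diff cuts off at the final comment without showing the bot wiring itself. The following is a plausible reconstruction under stated assumptions, not the commit's actual code: the self-message guard is inferred from the 'Ignoring my own message.' log line, DISCORD_TOKEN is an assumed environment variable name, and generate_response is stubbed out (the real one appears in the diff).

import logging
import os

import discord

logging.basicConfig(level=logging.DEBUG)

intents = discord.Intents.default()
intents.messages = True          # matches the hunk header in the diff
intents.message_content = True   # required on discord.py 2.x to read message text

async def generate_response(user_input):
    # Stub standing in for the diff's generate_response (see the sketch above).
    return f"echo: {user_input}"

class MyClient(discord.Client):
    async def on_message(self, message):
        # Guard inferred from the 'Ignoring my own message.' log line.
        if message.author == self.user:
            logging.info('Ignoring my own message.')
            return
        logging.debug(f'Receiving message: {message.content}')
        response = await generate_response(message.content)
        await message.channel.send(response)

# Create and run the Discord bot instance (DISCORD_TOKEN is an assumed name).
client = MyClient(intents=intents)
client.run(os.getenv("DISCORD_TOKEN"))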