aiqtech committed on
Commit b6f8016 · verified · 1 Parent(s): e491663

Update app.py

Files changed (1)
  1. app.py +38 -13
app.py CHANGED
@@ -1,11 +1,25 @@
 import gradio as gr
-from huggingface_hub import InferenceClient
+from huggingface_hub import InferenceClient, HfApi
 import os
 import requests
 import pandas as pd
 
-client = InferenceClient("meta-llama/Meta-Llama-3-70B-Instruct", token=os.getenv("HF_TOKEN"))
+# Check the Hugging Face token
+hf_token = os.getenv("HF_TOKEN")
+if not hf_token:
+    raise ValueError("The HF_TOKEN environment variable is not set.")
 
+# Check the model information
+api = HfApi(token=hf_token)
+try:
+    model_info = api.model_info("meta-llama/Meta-Llama-3-70B-Instruct")
+    print(f"Model info: {model_info}")
+except Exception as e:
+    print(f"Failed to fetch model info: {e}")
+    # Use a fallback model or perform error handling here.
+
+# Initialize the InferenceClient
+client = InferenceClient("meta-llama/Meta-Llama-3-70B-Instruct", token=hf_token)
 
 # Set relative paths based on the current script's directory
 current_dir = os.path.dirname(os.path.abspath(__file__))
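The startup block above only logs when `model_info` fails and leaves the recovery path as a comment. As a minimal sketch of one way to act on that comment (the 8B fallback repo id is an assumption for illustration, not part of this commit):

```python
import os
from huggingface_hub import HfApi, InferenceClient

hf_token = os.getenv("HF_TOKEN")
api = HfApi(token=hf_token)

# Candidate repos tried in order; the 8B fallback is hypothetical.
candidates = [
    "meta-llama/Meta-Llama-3-70B-Instruct",
    "meta-llama/Meta-Llama-3-8B-Instruct",
]

client = None
for model_id in candidates:
    try:
        api.model_info(model_id)  # raises if the repo is missing or gated
        client = InferenceClient(model_id, token=hf_token)
        break
    except Exception as e:
        print(f"{model_id} unavailable: {e}")

if client is None:
    raise RuntimeError("None of the candidate models are accessible.")
```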
 
@@ -48,17 +62,28 @@ def respond(
     response = ""
 
-    for message in client.chat_completion(
-        messages,
-        max_tokens=max_tokens,
-        stream=True,
-        temperature=temperature,
-        top_p=top_p,
-    ):
-        token = message.choices[0].delta.content
-        if token is not None:
-            response += token.strip("<|END_OF_TURN_TOKEN|>")
-        yield response
+    try:
+        for message in client.chat_completion(
+            messages,
+            max_tokens=max_tokens,
+            stream=True,
+            temperature=temperature,
+            top_p=top_p,
+        ):
+            if message is not None and hasattr(message, 'choices') and len(message.choices) > 0:
+                delta = message.choices[0].delta
+                if delta is not None and hasattr(delta, 'content') and delta.content is not None:
+                    token = delta.content.replace("<|END_OF_TURN_TOKEN|>", "")  # remove the marker substring; str.strip would treat it as a character set
+                    response += token
+                    yield response
+            else:
+                print("Received unexpected message format:", message)
+    except Exception as e:
+        print(f"Error during chat completion: {e}")
+        yield f"Sorry, an error occurred while generating the response: {str(e)}"
+
+    if not response:
+        yield "Sorry, no response could be generated."
 
 demo = gr.ChatInterface(
     respond,
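For a quick check of the streaming path outside Gradio, a minimal sketch using the same `huggingface_hub` client (assuming `HF_TOKEN` is set and the model is reachable through the Inference API):

```python
import os
from huggingface_hub import InferenceClient

client = InferenceClient("meta-llama/Meta-Llama-3-70B-Instruct", token=os.getenv("HF_TOKEN"))

messages = [{"role": "user", "content": "Say hello in one short sentence."}]

response = ""
for chunk in client.chat_completion(messages, max_tokens=64, stream=True):
    # Streamed chunks carry incremental deltas; content can be None on
    # role-only or final chunks, hence the guard.
    delta = chunk.choices[0].delta
    if delta.content:
        # Remove the end-of-turn marker as a substring; str.strip would
        # treat the argument as a set of characters to trim.
        response += delta.content.replace("<|END_OF_TURN_TOKEN|>", "")
print(response)
```

Because `respond` yields the accumulated `response` on every chunk, `gr.ChatInterface` can render the reply as a progressively growing message.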