wangrongsheng committed on
Commit
cd7ddd1
·
1 Parent(s): 4223a6d

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +27 -37
app.py CHANGED
@@ -1,40 +1,30 @@
1
- from transformers import AutoModel, AutoTokenizer
2
  import gradio as gr
3
 
 
 
 
 
 
4
  tokenizer = AutoTokenizer.from_pretrained("THUDM/chatglm-6b", trust_remote_code=True)
5
# Load ChatGLM-6B in fp16 on the GPU and switch straight to inference mode
# (.eval() returns the module itself, so the chain is equivalent to a
# separate `model = model.eval()` assignment).
model = AutoModel.from_pretrained(
    "THUDM/chatglm-6b", trust_remote_code=True
).half().cuda().eval()

# Display at most 20 dialogue turns; every turn occupies two boxes
# (one user query + one model reply).
MAX_TURNS = 20
MAX_BOXES = 2 * MAX_TURNS
10
-
11
-
12
def predict(input, history=None):
    """Run one chat turn and rebuild the fixed grid of chat text boxes.

    Args:
        input: The user's new query string (name kept for interface
            compatibility even though it shadows the builtin).
        history: List of (query, response) pairs from prior turns, or None
            on the first call.

    Returns:
        A list whose first element is the updated history (fed back into the
        gr.State) followed by MAX_BOXES gr.update payloads — visible boxes
        for each past query/response, hidden updates for the remainder.
    """
    if history is None:
        history = []
    # The immediate response is already included in the returned history,
    # so the first element of the tuple is not needed separately.
    _, history = model.chat(tokenizer, input, history)
    updates = []
    for past_query, past_response in history:
        updates.append(gr.update(visible=True, value="用户:" + past_query))
        updates.append(gr.update(visible=True, value="ChatGLM-6B:" + past_response))
    # Hide the unused boxes so the layout always has exactly MAX_BOXES slots.
    # (Use gr.update consistently; gr.Textbox.update is the deprecated form.)
    if len(updates) < MAX_BOXES:
        updates = updates + [gr.update(visible=False)] * (MAX_BOXES - len(updates))
    return [history] + updates
23
-
24
-
25
with gr.Blocks() as demo:
    # Conversation history lives in a Gradio State value shared across turns.
    state = gr.State([])

    # Pre-create MAX_BOXES hidden Markdown slots: even indices are user
    # queries ("提问:"), odd indices are model replies ("回复:").
    text_boxes = [
        gr.Markdown(visible=False, label="提问:" if idx % 2 == 0 else "回复:")
        for idx in range(MAX_BOXES)
    ]

    with gr.Row():
        with gr.Column(scale=4):
            txt = gr.Textbox(
                show_label=False,
                placeholder="Enter text and press enter",
            ).style(container=False)
        with gr.Column(scale=1):
            button = gr.Button("Generate")

    # Clicking feeds the textbox plus the state into predict, whose outputs
    # update the state and every chat box.
    button.click(predict, [txt, state], [state] + text_boxes)

demo.queue().launch(share=False)
 
1
+ import psutil
2
  import gradio as gr
3
 
4
+ from functools import partial
5
+ from transformers import AutoTokenizer, AutoModelForSeq2SeqLM
6
+
7
# Snapshot of host virtual memory. NOTE(review): `mem` is never read later
# in this file — confirm it isn't needed (e.g. for a capacity banner) before
# removing it and the psutil import.
mem = psutil.virtual_memory()

# trust_remote_code=True is required: ChatGLM ships its own modeling code.
tokenizer = AutoTokenizer.from_pretrained("THUDM/chatglm-6b", trust_remote_code=True)

# bfloat16 halves memory while keeping the float32 exponent range, suiting
# CPU inference. Restore .eval() (present in the previous revision) so
# dropout/training-only layers are disabled during inference.
model = AutoModelForSeq2SeqLM.from_pretrained(
    "THUDM/chatglm-6b", trust_remote_code=True
).bfloat16().eval()
12
+
13
def chat(query, history=None):
    """Run one chat turn against ChatGLM-6B (CPU, max_length capped at 512).

    Args:
        query: The user's new message.
        history: List of (query, response) pairs from earlier turns; None on
            the first call. A None sentinel replaces the original mutable
            default `history=[]`, which was shared across calls and leaked
            conversation history between independent sessions.

    Returns:
        (history, history) — the updated history twice, matching the
        Interface's ["chatbot", "state"] outputs.
    """
    if history is None:
        history = []
    # The fresh response is already folded into the returned history.
    _, history = model.chat(tokenizer, query, history, max_length=512)
    return history, history
16
+
17
# --- UI configuration -------------------------------------------------------
title = "ChatGLM-6B Chatbot"

# User-facing blurb (implicit concatenation keeps the text identical).
description = (
    "This is an unofficial chatbot application based on open source model "
    "ChatGLM-6B(https://github.com/THUDM/ChatGLM-6B), running on cpu"
    "(therefore max_length is limited to 512). \n"
    "If you want to use this chat bot in your space, 'Duplicate this space' "
    "by click the button close to 'Linked Models'. \n"
)

# Seed examples shown below the input box.
examples = [["Hello?"], ["你好。"], ["介绍清华"]]

# Wire the chat function into a simple text-in / chatbot-out interface;
# the "state" slots carry the conversation history across turns.
chatbot_interface = gr.Interface(
    fn=chat,
    inputs=["text", "state"],
    outputs=["chatbot", "state"],
    title=title,
    description=description,
    examples=examples,
)

chatbot_interface.launch()