Mistral-lab

Running on Zero

vilarin committed on Jul 18, 2024

Commit

c95f150

verified ·

1 Parent(s): f6cebe3

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -38,7 +38,7 @@ model = AutoModelForCausalLM.from_pretrained(
     MODEL,
     torch_dtype=torch.bfloat16,
     device_map="auto",
-    ignore_mismatched_sizes=True).to(device)
 @spaces.GPU()
 def stream_chat(
@@ -86,8 +86,6 @@ def stream_chat(
         yield buffer
-    #print(tokenizer.decode(outputs[0]))
 chatbot = gr.Chatbot(height=600, placeholder=PLACEHOLDER)
 with gr.Blocks(css=CSS, theme="soft") as demo:

     MODEL,
     torch_dtype=torch.bfloat16,
     device_map="auto",
+    ignore_mismatched_sizes=True)
 @spaces.GPU()
 def stream_chat(
         yield buffer
 chatbot = gr.Chatbot(height=600, placeholder=PLACEHOLDER)
 with gr.Blocks(css=CSS, theme="soft") as demo: