Update app.py
app.py CHANGED

@@ -33,7 +33,7 @@ h1 {
 }
 """
 
-
+model=""
 tokenizer = AutoTokenizer.from_pretrained(MODEL_ID, trust_remote_code=True)
 
 
@@ -99,12 +99,15 @@ def mode_load(path):
 @spaces.GPU()
 
 def stream_chat(message, history: list, temperature: float, max_length: int, top_p: float, top_k: int, penalty: float):
-    model = AutoModelForCausalLM.from_pretrained(
-        MODEL_ID,
-        torch_dtype=torch.bfloat16,
-        low_cpu_mem_usage=True,
-        trust_remote_code=True
-    )
+    if model=="":
+        model = AutoModelForCausalLM.from_pretrained(
+            MODEL_ID,
+            torch_dtype=torch.bfloat16,
+            low_cpu_mem_usage=True,
+            trust_remote_code=True
+        )
+
+
 
     print(f'message is - {message}')
     print(f'history is - {history}')
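The commit moves the AutoModelForCausalLM load out of the per-request path: model="" at module level acts as a sentinel, and stream_chat loads the weights only on the first call instead of on every call. One caveat: because stream_chat assigns to model, Python treats model as a local name throughout the function, so the if model=="" check also needs a global model declaration to rebind the module-level variable. Below is a minimal, self-contained sketch of the lazy-loading pattern with that declaration added; MODEL_ID is a hypothetical placeholder for the value app.py defines elsewhere.

import torch
from transformers import AutoModelForCausalLM, AutoTokenizer

MODEL_ID = "your-org/your-model"  # hypothetical stand-in for the Space's MODEL_ID

model = ""  # sentinel: nothing is loaded at import time, so startup stays fast
tokenizer = AutoTokenizer.from_pretrained(MODEL_ID, trust_remote_code=True)

def stream_chat(message, history: list):
    global model  # rebind the module-level name, not a function-local one
    if model == "":
        # First call only: load the weights once, then reuse them on later calls.
        model = AutoModelForCausalLM.from_pretrained(
            MODEL_ID,
            torch_dtype=torch.bfloat16,
            low_cpu_mem_usage=True,
            trust_remote_code=True,
        )
    print(f'message is - {message}')
    print(f'history is - {history}')

Lazy loading like this suits a sleeping Space: the container restarts quickly and only the first request pays the model-load cost. Using None as the sentinel with if model is None: would be the more idiomatic Python, but the string sentinel behaves the same here.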