Starling

Paused

Tonic committed on Nov 28, 2023

Commit

cc9677b

1 Parent(s): c026c75

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -33,11 +33,11 @@ repetition_penalty=1.7
 tokenizer = transformers.AutoTokenizer.from_pretrained(model_name)
 model = transformers.AutoModelForCausalLM.from_pretrained(model_name,
-    device_map="auto",
-    torch_dtype=torch.float16,
 #   load_in_4bit=True
 )
-model.eval()
 class StarlingBot:
     def __init__(self, system_prompt="The following dialogue is a conversation"):

 tokenizer = transformers.AutoTokenizer.from_pretrained(model_name)
 model = transformers.AutoModelForCausalLM.from_pretrained(model_name,
+    device_map="auto"
+    torch_dtype=torch.bfloat16,
 #   load_in_4bit=True
 )
+# model.eval()
 class StarlingBot:
     def __init__(self, system_prompt="The following dialogue is a conversation"):