Tonic committed on
Commit
cc9677b
·
1 Parent(s): c026c75

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +3 -3
app.py CHANGED
@@ -33,11 +33,11 @@ repetition_penalty=1.7
33
 
34
  tokenizer = transformers.AutoTokenizer.from_pretrained(model_name)
35
  model = transformers.AutoModelForCausalLM.from_pretrained(model_name,
36
- device_map="auto",
37
- torch_dtype=torch.float16,
38
  # load_in_4bit=True
39
  )
40
- model.eval()
41
 
42
  class StarlingBot:
43
  def __init__(self, system_prompt="The following dialogue is a conversation"):
 
33
 
34
  tokenizer = transformers.AutoTokenizer.from_pretrained(model_name)
35
  model = transformers.AutoModelForCausalLM.from_pretrained(model_name,
36
+ device_map="auto"
37
+ torch_dtype=torch.bfloat16,
38
  # load_in_4bit=True
39
  )
40
+ # model.eval()
41
 
42
  class StarlingBot:
43
  def __init__(self, system_prompt="The following dialogue is a conversation"):