ngcanh committed on
Commit
e091156
·
verified ·
1 Parent(s): e44ec40

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +2 -2
app.py CHANGED
@@ -38,10 +38,10 @@ def load_model():
38
 
39
  model = AutoModelForCausalLM.from_pretrained(
40
  MODEL_NAME,
41
- quantization_config=nf4_config, # add config
42
  torch_dtype=torch.bfloat16, # save memory using float16
43
  # low_cpu_mem_usage=True,
44
- token=get_hg_token(),
45
  ).to("cuda")
46
 
47
  tokenizer = AutoTokenizer.from_pretrained(MODEL_NAME)
 
38
 
39
  model = AutoModelForCausalLM.from_pretrained(
40
  MODEL_NAME,
41
+ # quantization_config=nf4_config, # add config
42
  torch_dtype=torch.bfloat16, # save memory using float16
43
  # low_cpu_mem_usage=True,
44
+ token=st.secrets["HF_TOKEN"],
45
  ).to("cuda")
46
 
47
  tokenizer = AutoTokenizer.from_pretrained(MODEL_NAME)