orionweller committed on
Commit
fbb5c51
·
1 Parent(s): 1239c17
Files changed (1) hide show
  1. app.py +3 -2
app.py CHANGED
@@ -70,8 +70,9 @@ def load_model():
70
  tokenizer.padding_side = "right"
71
 
72
  # model = AutoModel.from_pretrained(CUR_MODEL, max_memory={"cpu": "12GiB"}, torch_dtype=torch.bfloat16, offload_state_dict=True)
73
- base_model_instance = AutoModel.from_pretrained(BASE_MODEL, device="cpu")
74
- model = PeftModel.from_pretrained(base_model_instance, CUR_MODEL, device="cpu")
 
75
  model.eval()
76
 
77
 
 
70
  tokenizer.padding_side = "right"
71
 
72
  # model = AutoModel.from_pretrained(CUR_MODEL, max_memory={"cpu": "12GiB"}, torch_dtype=torch.bfloat16, offload_state_dict=True)
73
+ base_model_instance = AutoModel.from_pretrained(BASE_MODEL)
74
+ model = PeftModel.from_pretrained(base_model_instance, CUR_MODEL)
75
+ model = model.merge_and_unload()
76
  model.eval()
77
 
78