DesiredName committed on
Commit
383a904
·
verified ·
1 Parent(s): 752eb63

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +9 -2
app.py CHANGED
@@ -1,10 +1,17 @@
1
  from fastapi import FastAPI
2
  import uvicorn
3
- from transformers import AutoTokenizer, AutoModel
4
 
5
  model_name = "TheBloke/Wizard-Vicuna-13B-Uncensored-HF"
6
 
7
- model = AutoModel.from_pretrained(model_name, trust_remote_code=True)
 
 
 
 
 
 
 
8
  tokenizer = AutoTokenizer.from_pretrained(model_name, trust_remote_code=True)
9
  tokenizer.pad_token = tokenizer.eos_token
10
 
 
1
  from fastapi import FastAPI
2
  import uvicorn
3
+ from transformers import AutoTokenizer, AutoModelForCausalLM
4
 
5
  model_name = "TheBloke/Wizard-Vicuna-13B-Uncensored-HF"
6
 
7
+ model = AutoModelForCausalLM.from_pretrained(
8
+ model_name,
9
+ device_map="auto", # Auto-distribute layers across CPU/GPU
10
+ low_cpu_mem_usage=True, # Reduces CPU RAM during loading
11
+ torch_dtype="auto", # Automatically select dtype (float16/32)
12
+ offload_folder="offload",
13
+ trust_remote_code=True
14
+ )
15
  tokenizer = AutoTokenizer.from_pretrained(model_name, trust_remote_code=True)
16
  tokenizer.pad_token = tokenizer.eos_token
17