Spaces:
Build error
Build error
Update app.py
Browse files
app.py
CHANGED
@@ -1,10 +1,17 @@
|
|
1 |
from fastapi import FastAPI
|
2 |
import uvicorn
|
3 |
-
from transformers import AutoTokenizer,
|
4 |
|
5 |
model_name = "TheBloke/Wizard-Vicuna-13B-Uncensored-HF"
|
6 |
|
7 |
-
model =
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
8 |
tokenizer = AutoTokenizer.from_pretrained(model_name, trust_remote_code=True)
|
9 |
tokenizer.pad_token = tokenizer.eos_token
|
10 |
|
|
|
1 |
from fastapi import FastAPI
|
2 |
import uvicorn
|
3 |
+
from transformers import AutoTokenizer, AutoModelForCausalLM
|
4 |
|
5 |
model_name = "TheBloke/Wizard-Vicuna-13B-Uncensored-HF"
|
6 |
|
7 |
+
model = AutoModelForCausalLM.from_pretrained(
|
8 |
+
model_name,
|
9 |
+
device_map="auto", # Let Accelerate place layers across available GPU(s), CPU RAM, and disk
|
10 |
+
low_cpu_mem_usage=True, # Reduces CPU RAM during loading
|
11 |
+
torch_dtype="auto", # Use the dtype recorded in the checkpoint instead of defaulting to float32
|
12 |
+
offload_folder="offload", # Folder for weights that device_map places on disk
|
13 |
+
trust_remote_code=True
|
14 |
+
)
|
15 |
tokenizer = AutoTokenizer.from_pretrained(model_name, trust_remote_code=True)
|
16 |
tokenizer.pad_token = tokenizer.eos_token
|
17 |
|