DesiredName committed on
Commit
83c94c3
·
verified ·
1 Parent(s): bc8a564

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +1 -10
app.py CHANGED
@@ -1,21 +1,12 @@
1
  from fastapi import FastAPI
2
  import uvicorn
3
- import torch
4
- from transformers import AutoModelForCausalLM, AutoTokenizer, BitsAndBytesConfig
5
 
6
  model_name = "Tap-M/Luna-AI-Llama2-Uncensored"
7
 
8
- bnb_config = BitsAndBytesConfig(
9
- load_in_4bit=True,
10
- bnb_4bit_quant_type="nf4", # Must be 'nf4' for CPU compatibility
11
- bnb_4bit_compute_dtype="float32", # Use float32 for CPU computation
12
- bnb_4bit_use_double_quant=True
13
- )
14
-
15
  model = AutoModelForCausalLM.from_pretrained(
16
  model_name, # Example model
17
  device_map="auto", # Auto-distribute across GPU/CPU
18
- quantization_config=bnb_config,
19
  offload_folder="./offload", # Temporary directory
20
  trust_remote_code=True # Required for some models
21
  )
 
1
  from fastapi import FastAPI
2
  import uvicorn
3
+ from transformers import AutoModelForCausalLM, AutoTokenizer
 
4
 
5
  model_name = "Tap-M/Luna-AI-Llama2-Uncensored"
6
 
 
 
 
 
 
 
 
7
  model = AutoModelForCausalLM.from_pretrained(
8
  model_name, # Example model
9
  device_map="auto", # Auto-distribute across GPU/CPU
 
10
  offload_folder="./offload", # Temporary directory
11
  trust_remote_code=True # Required for some models
12
  )