ateetvatan committed on
Commit
6b456ee
·
1 Parent(s): 8dd6602
Files changed (1) hide show
  1. model_loader.py +2 -2
model_loader.py CHANGED
@@ -16,10 +16,10 @@ CTX_LEN = int(os.getenv("CTX_LEN", "8192")) # Use full 8K context
16
 
17
  # === Load Model ===
18
  model = AutoModelForCausalLM.from_pretrained(
19
- model_path=MODEL_REPO,
20
  model_file=MODEL_FILE,
21
  model_type=MODEL_TYPE,
22
  context_length=CTX_LEN,
23
- gpu_layers=0, # Set >0 if you want to offload layers to GPU
24
  local_files_only=False,
25
  )
 
16
 
17
  # === Load Model ===
18
  model = AutoModelForCausalLM.from_pretrained(
19
+ MODEL_REPO,
20
  model_file=MODEL_FILE,
21
  model_type=MODEL_TYPE,
22
  context_length=CTX_LEN,
23
+ gpu_layers=0,
24
  local_files_only=False,
25
  )