Tim Luka Horstmann committed on
Commit
bd95004
·
1 Parent(s): 58272f8

bigger model

Browse files
Files changed (1) hide show
  1. app.py +3 -2
app.py CHANGED
@@ -42,11 +42,12 @@ try:
42
  # Load Qwen 2.5 1.5B model with llama_cpp
43
  logger.info("Loading Qwen 2.5 1.5B model")
44
  model_path = hf_hub_download(
45
- repo_id="Qwen/Qwen2.5-1.5B-Instruct-GGUF",
46
- filename="qwen2.5-1.5b-instruct-q4_0.gguf",
47
  local_dir="/app/cache" if os.getenv("HF_HOME") else None,
48
  token=hf_token,
49
  )
 
50
  generator = Llama(
51
  model_path=model_path,
52
  n_ctx=2048,
 
42
  # Load Qwen 2.5 1.5B model with llama_cpp
43
  logger.info("Loading Qwen 2.5 1.5B model")
44
  model_path = hf_hub_download(
45
+ repo_id="bartowski/Qwen2.5-7B-Instruct-GGUF", #"Qwen/Qwen2.5-1.5B-Instruct-GGUF",
46
+ filename="Qwen2.5-7B-Instruct-Q6_K.gguf", #"qwen2.5-1.5b-instruct-q4_0.gguf",
47
  local_dir="/app/cache" if os.getenv("HF_HOME") else None,
48
  token=hf_token,
49
  )
50
+
51
  generator = Llama(
52
  model_path=model_path,
53
  n_ctx=2048,