Tim Luka Horstmann
committed on
Commit
·
bd95004
1
Parent(s):
58272f8
bigger model
Browse files
app.py
CHANGED
@@ -42,11 +42,12 @@ try:
|
|
42 |
# Load Qwen 2.5 1.5B model with llama_cpp
|
43 |
logger.info("Loading Qwen 2.5 1.5B model")
|
44 |
model_path = hf_hub_download(
|
45 |
-
repo_id="Qwen/Qwen2.5-1.5B-Instruct-GGUF",
|
46 |
-
filename="qwen2.5-1.5b-instruct-q4_0.gguf",
|
47 |
local_dir="/app/cache" if os.getenv("HF_HOME") else None,
|
48 |
token=hf_token,
|
49 |
)
|
|
|
50 |
generator = Llama(
|
51 |
model_path=model_path,
|
52 |
n_ctx=2048,
|
|
|
42 |
# Load Qwen 2.5 1.5B model with llama_cpp
|
43 |
logger.info("Loading Qwen 2.5 1.5B model")
|
44 |
model_path = hf_hub_download(
|
45 |
+
repo_id="bartowski/Qwen2.5-7B-Instruct-GGUF", #"Qwen/Qwen2.5-1.5B-Instruct-GGUF",
|
46 |
+
filename="Qwen2.5-7B-Instruct-Q6_K.gguf", #"qwen2.5-1.5b-instruct-q4_0.gguf",
|
47 |
local_dir="/app/cache" if os.getenv("HF_HOME") else None,
|
48 |
token=hf_token,
|
49 |
)
|
50 |
+
|
51 |
generator = Llama(
|
52 |
model_path=model_path,
|
53 |
n_ctx=2048,
|