Update app.py
Browse files
app.py
CHANGED
@@ -62,7 +62,7 @@ logger.info(f"Using n_threads: {recommended_threads}")
|
|
62 |
try:
|
63 |
llm = Llama(
|
64 |
model_path=model_path,
|
65 |
-
n_ctx=
|
66 |
n_threads=recommended_threads,
|
67 |
use_mlock=True, # Lock model in RAM for faster access
|
68 |
n_gpu_layers=0, # CPU only
|
|
|
62 |
try:
|
63 |
llm = Llama(
|
64 |
model_path=model_path,
|
65 |
+
n_ctx=2048, # Context window size for the model (still needed, but not fully utilized for history)
|
66 |
n_threads=recommended_threads,
|
67 |
use_mlock=True, # Lock model in RAM for faster access
|
68 |
n_gpu_layers=0, # CPU only
|