ndc8
committed on
Commit
·
a2a4e98
1
Parent(s):
0c37db0
Fix GGUF filename in environment variable and update comment in requirements
Browse files
- gguf_transformers_backend.py +1 -1
- requirements.txt +1 -1
gguf_transformers_backend.py
CHANGED
@@ -65,7 +65,7 @@ class HealthResponse(BaseModel):
|
|
65 |
|
66 |
# Global variables for model management
|
67 |
current_model = os.environ.get("AI_MODEL", "unsloth/gemma-3n-E4B-it-GGUF")
|
68 |
-
gguf_filename = os.environ.get("GGUF_FILE", "
|
69 |
tokenizer = None
|
70 |
model = None
|
71 |
text_pipeline = None
|
|
|
65 |
|
66 |
# Global variables for model management
|
67 |
current_model = os.environ.get("AI_MODEL", "unsloth/gemma-3n-E4B-it-GGUF")
|
68 |
+
gguf_filename = os.environ.get("GGUF_FILE", "gemma-3n-E4B-it-Q4_K_M.gguf")
|
69 |
tokenizer = None
|
70 |
model = None
|
71 |
text_pipeline = None
|
requirements.txt
CHANGED
@@ -12,7 +12,7 @@ transformers>=4.45.0
|
|
12 |
torch>=2.0.0
|
13 |
accelerate
|
14 |
|
15 |
-
# Required
|
16 |
protobuf
|
17 |
sentencepiece>=0.2.0
|
18 |
tokenizers
|
|
|
12 |
torch>=2.0.0
|
13 |
accelerate
|
14 |
|
15 |
+
# Required for GGUF model loading
|
16 |
protobuf
|
17 |
sentencepiece>=0.2.0
|
18 |
tokenizers
|