Priyanshu Kumar committed
Commit · 43cc365
Parent(s): 37a2a92

Switch to Docker SDK for FastAPI app
Files changed:
- DOCKERFILE  +2 -4
- app.py  +44 -0
DOCKERFILE
CHANGED
@@ -7,11 +7,9 @@ RUN useradd -m -u 1000 user
 USER user
 ENV PATH="/home/user/.local/bin:$PATH"
 
-#app directory is ./app where the FastAPI app is located
-WORKDIR /app
-
 COPY --chown=user ./requirements.txt requirements.txt
 RUN pip install --no-cache-dir --upgrade -r requirements.txt
 
-COPY
+COPY . .
+
 CMD ["uvicorn", "app:app", "--host", "0.0.0.0", "--port", "7860"]
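A minimal smoke test for the rebuilt container, in Python. The image name "mistral-api" and the docker commands in the comment are illustrative assumptions, not part of this commit; only the root endpoint and port 7860 come from the files in the diff:

# Build and start the container first, e.g. (names are assumptions):
#   docker build -t mistral-api .
#   docker run -p 7860:7860 mistral-api
import json
import urllib.request

# app.py serves GET / with a liveness message; port 7860 comes from the CMD above.
with urllib.request.urlopen("http://localhost:7860/") as resp:
    print(json.load(resp))  # expected: {"message": "Mistral API is live!"}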
app.py
ADDED
@@ -0,0 +1,44 @@
+from fastapi import FastAPI, Request
+from llama_cpp import Llama
+from huggingface_hub import hf_hub_download
+import os
+
+app = FastAPI()
+
+# === Model Config ===
+REPO_ID = "TheBloke/Mistral-7B-Instruct-v0.1-GGUF"
+FILENAME = "mistral-7b-instruct-v0.1.Q4_K_M.gguf"
+MODEL_DIR = "models"
+MODEL_PATH = os.path.join(MODEL_DIR, FILENAME)
+
+# === Download only if not already present ===
+if not os.path.exists(MODEL_PATH):
+    print(f"Downloading model {FILENAME} from Hugging Face...")
+    model_path = hf_hub_download(
+        repo_id=REPO_ID,
+        filename=FILENAME,
+        cache_dir=MODEL_DIR,
+        local_dir=MODEL_DIR,
+        local_dir_use_symlinks=False
+    )
+else:
+    print(f"Model already exists at: {MODEL_PATH}")
+    model_path = MODEL_PATH
+
+# === Load LLM ===
+llm = Llama(
+    model_path=model_path,
+    n_ctx=1024,
+    n_threads=4  # Adjust for your CPU
+)
+
+@app.get("/")
+def root():
+    return {"message": "Mistral API is live!"}
+
+@app.post("/generate")
+async def generate(request: Request):
+    data = await request.json()
+    prompt = data.get("prompt", "")
+    response = llm(prompt, max_tokens=128, temperature=0.7)
+    return {"response": response["choices"][0]["text"]}
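A minimal client sketch for the /generate endpoint added above. The host and port are assumptions based on the Dockerfile CMD; only the /generate route and its {"prompt": ...} payload shape come from app.py:

import json
import urllib.request

# POST a JSON body with a "prompt" key, as generate() expects.
payload = json.dumps({"prompt": "Explain FastAPI in one sentence."}).encode()
req = urllib.request.Request(
    "http://localhost:7860/generate",
    data=payload,
    headers={"Content-Type": "application/json"},
)
with urllib.request.urlopen(req) as resp:
    print(json.load(resp)["response"])  # the model's completion text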