Spaces:
Runtime error
Runtime error
from flask import Flask, request, jsonify | |
from app import generate_chat_completion | |
import time | |
# WSGI application object; created at import time so the rest of the module
# (and any external server importing this file) can refer to it.
app = Flask(__name__)
def chat_completions():
    """Run one chat-completion turn and return the assistant reply as JSON.

    The request body must be a JSON object holding a non-empty ``messages``
    list of ``{"role": ..., "content": ...}`` objects. The content of the
    last entry is passed to ``generate_chat_completion`` as the new message
    and every earlier entry is passed as the history.

    Returns:
        On success, a JSON response with the model name, a single-choice
        ``choices`` list, the generation time in seconds (rounded to two
        decimals) and the updated history.
        A ``(response, 400)`` tuple when the body is missing, is not a JSON
        object, has no usable ``messages`` list, or its last message lacks
        a ``content`` field.
        A ``(response, 500)`` tuple carrying ``str(exc)`` when generation
        raises.
    """
    # NOTE(review): no route decorator is visible in this view of the file;
    # confirm this function is registered on ``app`` somewhere.

    # silent=True yields None for a missing or unparsable body instead of
    # raising, so malformed requests get the JSON 400 below.
    data = request.get_json(silent=True)
    if not isinstance(data, dict):
        return jsonify({"error": "A valid 'messages' list is required."}), 400

    messages = data.get('messages')  # list of {"role":..., "content":...}
    if not messages or not isinstance(messages, list):
        return jsonify({"error": "A valid 'messages' list is required."}), 400

    # A malformed final message is a client error, not a server failure.
    last_message = messages[-1]
    if not isinstance(last_message, dict) or 'content' not in last_message:
        return jsonify(
            {"error": "The last message must be an object with a 'content' field."}
        ), 400

    try:
        # perf_counter is monotonic, so the measured duration cannot go
        # negative or jump if the system clock is adjusted mid-request.
        start = time.perf_counter()
        new_history = generate_chat_completion(
            message=last_message['content'],
            history=messages[:-1],  # feed all except last user message
        )
        # The reply is read from the final entry of the returned history.
        assistant_msg = new_history[-1]['content']
        elapsed = time.perf_counter() - start
        return jsonify({
            "model": "tiiuae/falcon-rw-1b",
            "choices": [{
                "message": {"role": "assistant", "content": assistant_msg}
            }],
            "usage": {"generation_time": round(elapsed, 2)},
            "history": new_history,
        })
    except Exception as e:
        # Top-level boundary: report any generation failure as a JSON 500.
        return jsonify({"error": str(e)}), 500
def health_check():
    """Return a fixed status message paired with the integer 200.

    The result is a ``(body, status)`` tuple: the text
    ``"LLM API is running"`` and the code ``200``.
    """
    # NOTE(review): no route decorator is visible in this view of the file;
    # confirm this function is registered on ``app`` somewhere.
    return "LLM API is running", 200
if __name__ == '__main__':
    # Only start the server when this file is executed directly, not when
    # it is imported. Listens on all interfaces (0.0.0.0), port 8081.
    app.run(port=8081, host='0.0.0.0')