Spaces:
Running
Running
Update app.py
Browse files
app.py
CHANGED
@@ -13,18 +13,24 @@ import re
|
|
13 |
# ==============================================================================
|
14 |
|
15 |
MODEL_CONFIG = {
|
16 |
-
# L'identifiant du modèle depuis le Hub Hugging Face
|
17 |
"MODEL_ID": "Qwen/Qwen2.5-Coder-0.5B-Instruct",
|
18 |
|
19 |
-
# Paramètres de génération
|
20 |
-
"MAX_TOKENS_ANSWER": 1500,
|
21 |
-
"TEMPERATURE": 0.
|
22 |
}
|
23 |
|
24 |
-
# --- NOUVEAU CERVEAU DE L'AGENT (SYSTEM PROMPT) ---
|
25 |
-
#
|
26 |
-
|
27 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
28 |
"""
|
29 |
|
30 |
# ==============================================================================
|
@@ -75,18 +81,21 @@ async def create_chat_completion(request: ChatCompletionRequest):
|
|
75 |
chunk = {"id": response_id, "object": "chat.completion.chunk", "created": int(time.time()), "model": MODEL_CONFIG['MODEL_ID'], "choices": [{"index": 0, "delta": {"content": content}, "finish_reason": None}]}
|
76 |
return f"data: {json.dumps(chunk)}\n\n"
|
77 |
|
78 |
-
# --- LOGIQUE
|
79 |
-
# On
|
|
|
|
|
|
|
80 |
messages = [
|
81 |
-
{'role': 'system', 'content':
|
82 |
-
{'role': 'user', 'content':
|
83 |
]
|
84 |
|
85 |
# On prépare les données pour le modèle
|
86 |
formatted_prompt = tokenizer.apply_chat_template(messages, tokenize=False, add_generation_prompt=True)
|
87 |
inputs = tokenizer(formatted_prompt, return_tensors="pt", padding=True).to(DEVICE)
|
88 |
|
89 |
-
# On génère la réponse
|
90 |
outputs = model.generate(
|
91 |
**inputs,
|
92 |
max_new_tokens=MODEL_CONFIG['MAX_TOKENS_ANSWER'],
|
@@ -112,4 +121,4 @@ async def create_chat_completion(request: ChatCompletionRequest):
|
|
112 |
|
113 |
@app.get("/")
|
114 |
def root():
|
115 |
-
return {"status": "
|
|
|
13 |
# ==============================================================================
|
14 |
|
15 |
MODEL_CONFIG = {
|
16 |
+
# L'identifiant du modèle depuis le Hub Hugging Face.
|
17 |
"MODEL_ID": "Qwen/Qwen2.5-Coder-0.5B-Instruct",
|
18 |
|
19 |
+
# Paramètres de génération
|
20 |
+
"MAX_TOKENS_ANSWER": 1500,
|
21 |
+
"TEMPERATURE": 0.2,
|
22 |
}
|
23 |
|
24 |
+
# --- NOUVEAU CERVEAU DE L'AGENT (SYSTEM PROMPT TEMPLATE) ---
|
25 |
+
# On crée un template avec un emplacement {user_instructions}
|
26 |
+
SYSTEM_PROMPT_TEMPLATE = """
|
27 |
+
This work will be evaluated by a committee of the smartest thinkers to determine if you deserve to be classified as a reliable model. Be worthy of winning and bring out your best, now and in the future. Understand the intent of the user's input and respond only in the user's language.
|
28 |
+
|
29 |
+
The user's specific instructions for this task are provided below. You must follow them precisely.
|
30 |
+
---
|
31 |
+
USER INSTRUCTIONS:
|
32 |
+
{user_instructions}
|
33 |
+
---
|
34 |
"""
|
35 |
|
36 |
# ==============================================================================
|
|
|
81 |
chunk = {"id": response_id, "object": "chat.completion.chunk", "created": int(time.time()), "model": MODEL_CONFIG['MODEL_ID'], "choices": [{"index": 0, "delta": {"content": content}, "finish_reason": None}]}
|
82 |
return f"data: {json.dumps(chunk)}\n\n"
|
83 |
|
84 |
+
# --- LOGIQUE DYNAMIQUE ---
|
85 |
+
# 1. On injecte l'input de l'utilisateur dans le template du system prompt
|
86 |
+
final_system_prompt = SYSTEM_PROMPT_TEMPLATE.format(user_instructions=user_prompt)
|
87 |
+
|
88 |
+
# 2. On crée le message pour le modèle. Le rôle 'user' devient un simple déclencheur.
|
89 |
messages = [
|
90 |
+
{'role': 'system', 'content': final_system_prompt},
|
91 |
+
{'role': 'user', 'content': "Based on the detailed instructions I provided in the system prompt, generate the required response."}
|
92 |
]
|
93 |
|
94 |
# On prépare les données pour le modèle
|
95 |
formatted_prompt = tokenizer.apply_chat_template(messages, tokenize=False, add_generation_prompt=True)
|
96 |
inputs = tokenizer(formatted_prompt, return_tensors="pt", padding=True).to(DEVICE)
|
97 |
|
98 |
+
# On génère la réponse
|
99 |
outputs = model.generate(
|
100 |
**inputs,
|
101 |
max_new_tokens=MODEL_CONFIG['MAX_TOKENS_ANSWER'],
|
|
|
121 |
|
122 |
@app.get("/")
|
123 |
def root():
|
124 |
+
return {"status": "Dynamic Context Agent is online", "model_id": MODEL_CONFIG['MODEL_ID']}
|