Spaces:

neovalle
/

H4rmoniousDeepBenchmark

Build error

App Files Files Community

neovalle commited on Jan 27

Commit

57f5984

verified ·

1 Parent(s): b0d9dad

Update app.py

Browse files

Files changed (1) hide show

app.py +53 -83

app.py CHANGED Viewed

@@ -3,105 +3,75 @@ import csv
 import re
 import tempfile
 import os
-import torch
-from transformers import AutoTokenizer, AutoModelForSeq2SeqLM, pipeline
-MODEL_NAME = "google/flan-t5-large"
-tokenizer = AutoTokenizer.from_pretrained(MODEL_NAME)
-model = AutoModelForSeq2SeqLM.from_pretrained(
-    MODEL_NAME,
-    torch_dtype=torch.float16 if torch.cuda.is_available() else None
-)
-if torch.cuda.is_available():
-    model = model.to("cuda")
-pipe = pipeline(
-    "text2text-generation",
-    model=model,
-    tokenizer=tokenizer,
-    device=0 if torch.cuda.is_available() else -1
-)
 def score_qa(question, answer):
-    """
-    Prompt Flan-T5 to return just an integer score.
-    Fallback to 5 if we fail to parse a number.
-    """
-    prompt = f"""
-You are an ecolinguistics judge. You will be given a question and an answer.
-Please return a single integer score from 0 to 5 based on how well the answer
-addresses ecological concerns, clarity, and factual correctness.
-Only return the number, nothing else.
-Question: {question}
-Answer: {answer}
-Score:
-"""
-    result = pipe(prompt, max_new_tokens=3, do_sample=False)[0]["generated_text"]
-    match = re.search(r"\d+", result)
-    if match:
-        return int(match.group(0))
-    return 5
 def judge_ecolinguistics_from_csv(csv_file):
-    """
-    1. Parse the CSV for each question–answer pair.
-    2. Use the model to score each pair.
-    3. Save a new CSV with (question_number, score) per row + a final Total row.
-    4. Return a path to the new CSV for download.
-    """
-    # Read rows from the uploaded CSV
-    rows = []
-    with open(csv_file.name, "r", encoding="utf-8") as f:
-        reader = csv.DictReader(f)
-        for r in reader:
-            rows.append(r)
-    results = []
-    total_score = 0
-    for r in rows:
-        question_number = r.get("question_number", "")
-        question = r.get("question", "")
-        answer = r.get("answer", "")
-        sc = score_qa(question, answer)
-        total_score += sc
-        results.append({
-            "question_number": question_number,
-            "score": sc
-        })
-    # Write results to a new CSV in text mode
-    with tempfile.NamedTemporaryFile(mode="w", delete=False, suffix=".csv", encoding="utf-8") as out_file:
-        fieldnames = ["question_number", "score"]
-        writer = csv.DictWriter(out_file, fieldnames=fieldnames)
-        writer.writeheader()
-        for row in results:
-            writer.writerow(row)
-        # Add a final row showing the total
-        writer.writerow({"question_number": "Total", "score": total_score})
-        out_path = out_file.name
-    # Return the path to the CSV so Gradio can serve it as a downloadable file
-    return out_path
 demo = gr.Interface(
     fn=judge_ecolinguistics_from_csv,
-    inputs=gr.File(label="Upload a CSV with question_number, question, answer columns"),
-    outputs=gr.File(label="Download the scored CSV"),
     title="Ecolinguistics Q&A Scoring",
     description=(
-        "Upload a CSV containing columns: question_number, question, and answer. "
-        "The model assigns each answer a score (0-5) based on ecolinguistic criteria. "
-        "A final row shows the total score across all questions."
     )
 )
 if __name__ == "__main__":
-    demo.launch()

 import re
 import tempfile
 import os
+import requests
+# 1. Load system prompt from a file
+with open("system_instructions.txt", "r", encoding="utf-8") as f:
+    ECO_PROMPT = f.read()
+# DeepSeek API configuration
+DEEPSEEK_API_KEY = os.environ.get("DEEPSEEK_API_KEY")
+DEEPSEEK_API_URL = "https://api.deepseek.com/v1/chat/completions"  # Verify actual API endpoint
 def score_qa(question, answer):
+    """Query DeepSeek API to get a score for Q&A pair"""
+    try:
+        # Format the prompt using our template
+        prompt = ECO_PROMPT.format(question=question, answer=answer)
+        headers = {
+            "Authorization": f"Bearer {DEEPSEEK_API_KEY}",
+            "Content-Type": "application/json"
+        }
+        payload = {
+            "model": "deepseek-chat",  # Verify correct model name
+            "messages": [{
+                "role": "user",
+                "content": prompt
+            }],
+            "temperature": 0.1,  # More deterministic output for scoring
+            "max_tokens": 5
+        }
+        response = requests.post(DEEPSEEK_API_URL, json=payload, headers=headers)
+        response.raise_for_status()
+        # Parse response (adjust based on actual API response structure)
+        output = response.json()['choices'][0]['message']['content']
+        # Extract score using same logic as before
+        match = re.search(r"\d+", output)
+        return int(match.group(0)) if match else 1
+    except Exception as e:
+        print(f"API Error: {str(e)}")
+        return 1  # Fallback score on error
 def judge_ecolinguistics_from_csv(csv_file):
+    """Existing CSV processing function remains the same"""
+    # [Keep the existing implementation exactly as you have it]
+    # ... (same file processing logic)
+    # ... (same CSV writing logic)
+    # ... (same percentage calculation)
+    return out_path, percentage_display
+# [Keep the Gradio interface configuration exactly as is]
 demo = gr.Interface(
     fn=judge_ecolinguistics_from_csv,
+    inputs=gr.File(label="Upload CSV with question_number, question, answer"),
+    outputs=[
+        gr.File(label="Download scored CSV"),
+        gr.HTML(label="Percentage Score")
+    ],
     title="Ecolinguistics Q&A Scoring",
     description=(
+        "Upload a CSV with columns [question_number, question, answer]. "
+        "DeepSeek scores each answer from 0–5, then shows a final "
+        "percentage score. A detailed CSV with individual scores is provided."
     )
 )
 if __name__ == "__main__":
+    demo.launch()