Spaces:

neovalle
/

H4rmoniousDeepBenchmark

Build error

App Files Files Community

neovalle committed on Jan 27

Commit

3022b90

verified ·

1 Parent(s): 9daaf08

Update app.py

Browse files

Files changed (1) hide show

app.py +44 -76

app.py CHANGED Viewed

@@ -1,77 +1,45 @@
-import gradio as gr
-import csv
-import re
-import tempfile
-import os
-import requests
-# 1. Load system prompt from a file
-with open("system_instructions.txt", "r", encoding="utf-8") as f:
-    ECO_PROMPT = f.read()
-# DeepSeek API configuration
-DEEPSEEK_API_KEY = os.environ.get("DEEPSEEK_API_KEY")
-DEEPSEEK_API_URL = "https://api.deepseek.com/v1/chat/completions"  # Verify actual API endpoint
-def score_qa(question, answer):
-    """Query DeepSeek API to get a score for Q&A pair"""
-    try:
-        # Format the prompt using our template
-        prompt = ECO_PROMPT.format(question=question, answer=answer)
-        headers = {
-            "Authorization": f"Bearer {DEEPSEEK_API_KEY}",
-            "Content-Type": "application/json"
-        }
-        payload = {
-            "model": "deepseek-chat",  # Verify correct model name
-            "messages": [{
-                "role": "user",
-                "content": prompt
-            }],
-            "temperature": 0.1,  # More deterministic output for scoring
-            "max_tokens": 5
-        }
-        response = requests.post(DEEPSEEK_API_URL, json=payload, headers=headers)
-        response.raise_for_status()
-        # Parse response (adjust based on actual API response structure)
-        output = response.json()['choices'][0]['message']['content']
-        # Extract score using same logic as before
-        match = re.search(r"\d+", output)
-        return int(match.group(0)) if match else 1
-    except Exception as e:
-        print(f"API Error: {str(e)}")
-        return 1  # Fallback score on error
 def judge_ecolinguistics_from_csv(csv_file):
-    """Existing CSV processing function remains the same"""
-    # [Keep the existing implementation exactly as you have it]
-    # ... (same file processing logic)
-    # ... (same CSV writing logic)
-    # ... (same percentage calculation)
-    return out_path, percentage_display
-# [Keep the Gradio interface configuration exactly as is]
-demo = gr.Interface(
-    fn=judge_ecolinguistics_from_csv,
-    inputs=gr.File(label="Upload CSV with question_number, question, answer"),
-    outputs=[
-        gr.File(label="Download scored CSV"),
-        gr.HTML(label="Percentage Score")
-    ],
-    title="Ecolinguistics Q&A Scoring",
-    description=(
-        "Upload a CSV with columns [question_number, question, answer]. "
-        "DeepSeek scores each answer from 0–5, then shows a final "
-        "percentage score. A detailed CSV with individual scores is provided."
-    )
-)
-if __name__ == "__main__":
-    demo.launch()

 def judge_ecolinguistics_from_csv(csv_file):
+    """
+    Score every Q&A row of a CSV file and summarise the results.
+
+    Opens csv_file.name as UTF-8 and reads it with csv.DictReader, using the
+    "question_number", "question" and "answer" columns (a missing column is
+    read as an empty string). Each question/answer pair is passed to
+    score_qa and the returned scores are summed.
+
+    Returns a tuple (out_path, percentage_display):
+      - out_path: path of a temporary .csv file holding one
+        question_number/score row per input row plus a final "Total" row.
+        The file is created with delete=False and is not removed here.
+      - percentage_display: an HTML <h2> string showing
+        total / (rows * 5) * 100 to one decimal place, or 0.0% when the
+        input has no data rows.
+
+    NOTE(review): score_qa, csv and tempfile are not defined in the lines
+    shown with this function -- confirm they are still in scope in app.py.
+    """
+    # Load all rows up front; the row count is reused below for the percentage
+    rows = []
+    with open(csv_file.name, "r", encoding="utf-8") as f:
+        reader = csv.DictReader(f)
+        for r in reader:
+            rows.append(r)
+    results = []
+    total_score = 0
+    # Score each Q&A pair and keep a running total
+    for r in rows:
+        q_num = r.get("question_number", "")
+        question = r.get("question", "")
+        answer = r.get("answer", "")
+        sc = score_qa(question, answer)
+        total_score += sc
+        results.append({"question_number": q_num, "score": sc})
+    # Write results to a new CSV in a temp file (delete=False keeps it on disk after the with-block)
+    with tempfile.NamedTemporaryFile(mode="w", delete=False, suffix=".csv", encoding="utf-8") as out_file:
+        fieldnames = ["question_number", "score"]
+        writer = csv.DictWriter(out_file, fieldnames=fieldnames)
+        writer.writeheader()
+        for row in results:
+            writer.writerow(row)
+        writer.writerow({"question_number": "Total", "score": total_score})
+        out_path = out_file.name  # Path of the scored CSV; this is the first return value
+    # Compute % score: total / (num_questions * 5) * 100
+    # (5 is used as the per-question maximum -- presumably the top of the scoring scale; verify against score_qa)
+    num_questions = len(rows)
+    if num_questions > 0:
+        percentage = (total_score / (num_questions * 5)) * 100
+    else:
+        # No data rows: report 0.0 rather than dividing by zero
+        percentage = 0.0
+    percentage_display = f"<h2 style='font-size:2em; color:blue;'>Overall Score: {percentage:.1f}%</h2>"
+    return out_path, percentage_display  # (scored CSV path, HTML summary string)