Spaces:

m-ric
/

predibench-backend

Running

App Files Files Community

M-Rique commited on 5 days ago

Commit

43aad2c

0 Parent(s):

First commit

Browse files

Files changed (2) hide show

app.py +278 -0
requirements.txt +6 -0

app.py ADDED Viewed

	@@ -0,0 +1,278 @@

+import os
+import textwrap
+from datetime import date, datetime, timedelta
+import gradio as gr
+import pandas as pd
+from apscheduler.schedulers.background import BackgroundScheduler
+from datasets import Dataset
+from dotenv import load_dotenv
+from huggingface_hub import HfApi
+from predibench.agent.agent import run_smolagent
+from predibench.polymarket_api import (
+    MarketRequest,
+    filter_interesting_questions,
+    filter_out_resolved_markets,
+    get_open_markets,
+)
+load_dotenv()
+# Configuration
+WEEKLY_MARKETS_REPO = "m-ric/predibench-weekly-markets"
+AGENT_CHOICES_REPO = "m-ric/predibench-agent-choices"
+N_MARKETS = 10
+def restart_space():
+    """Restart the HuggingFace space"""
+    try:
+        HfApi(token=os.getenv("HF_TOKEN", None)).restart_space(
+            repo_id="m-ric/predibench-backend"  # Update with your actual space repo
+        )
+        print(f"Space restarted on {datetime.now()}")
+    except Exception as e:
+        print(f"Failed to restart space: {e}")
+def get_top_polymarket_questions(n_markets: int = 10) -> list:
+    """Fetch top questions from Polymarket API"""
+    end_date = date.today() + timedelta(days=7)
+    request = MarketRequest(
+        limit=n_markets * 10,
+        active=True,
+        closed=False,
+        order="volumeNum",
+        ascending=False,
+        end_date_min=end_date,
+        end_date_max=end_date + timedelta(days=21),
+    )
+    markets = get_open_markets(request)
+    markets = filter_out_resolved_markets(markets)
+    # Filter for interesting questions
+    interesting_questions = filter_interesting_questions(
+        [market.question for market in markets]
+    )
+    markets = [market for market in markets if market.question in interesting_questions]
+    return markets[:n_markets]
+def upload_weekly_markets(markets: list):
+    """Upload weekly markets to HuggingFace dataset"""
+    markets_data = []
+    for market in markets:
+        markets_data.append(
+            {
+                "id": market.id,
+                "question": market.question,
+                "slug": market.slug,
+                "description": market.description,
+                "end_date": market.end_date,
+                "active": market.active,
+                "closed": market.closed,
+                "volume": market.volume,
+                "liquidity": market.liquidity,
+                "week_selected": date.today().strftime("%Y-%m-%d"),
+                "timestamp": datetime.now(),
+            }
+        )
+    df = pd.DataFrame(markets_data)
+    dataset = Dataset.from_pandas(df)
+    try:
+        # Try to load existing dataset and append
+        existing_dataset = Dataset.from_parquet(f"hf://datasets/{WEEKLY_MARKETS_REPO}")
+        combined_dataset = existing_dataset.concatenate(dataset)
+        combined_dataset.push_to_hub(WEEKLY_MARKETS_REPO, private=False)
+    except:
+        # If no existing dataset, create new one
+        dataset.push_to_hub(WEEKLY_MARKETS_REPO, private=False)
+    print(f"Uploaded {len(markets_data)} markets to {WEEKLY_MARKETS_REPO}")
+def run_agent_decisions(markets: list, model_ids: list = None):
+    """Run agent decision-making logic on the selected markets"""
+    if model_ids is None:
+        model_ids = [
+            "gpt-4o",
+            "gpt-4.1",
+            "anthropic/claude-sonnet-4-20250514",
+            "huggingface/Qwen/Qwen3-30B-A3B-Instruct-2507",
+        ]
+    today = date.today()
+    decisions = []
+    for model_id in model_ids:
+        for market in markets:
+            # Create the investment decision prompt
+            full_question = textwrap.dedent(
+                f"""Let's say we are the {today.strftime("%B %d, %Y")}.
+                Please answer the below question by yes or no. But first, run a detailed analysis.
+                Here is the question:
+                {market.question}
+                More details:
+                {market.description}
+                Invest in yes only if you think the yes is underrated, and invest in no only if you think that the yes is overrated.
+                What would you decide: buy yes, buy no, or do nothing?
+                """
+            )
+            try:
+                response = run_smolagent(model_id, full_question, cutoff_date=today)
+                choice = response.output.lower()
+                # Standardize choice format
+                if "yes" in choice:
+                    choice_standardized = 1
+                    choice_raw = "yes"
+                elif "no" in choice:
+                    choice_standardized = -1
+                    choice_raw = "no"
+                else:
+                    choice_standardized = 0
+                    choice_raw = "nothing"
+                decisions.append(
+                    {
+                        "agent_name": f"smolagent_{model_id}".replace("/", "--"),
+                        "date": today,
+                        "question": market.question,
+                        "question_id": market.id,
+                        "choice": choice_standardized,
+                        "choice_raw": choice_raw,
+                        "messages_count": len(response.messages),
+                        "has_reasoning": len(response.messages) > 0,
+                        "timestamp": datetime.now(),
+                    }
+                )
+                print(f"Completed decision for {model_id} on {market.question[:50]}...")
+            except Exception as e:
+                print(f"Error processing {model_id} on {market.question[:50]}: {e}")
+                continue
+    return decisions
+def upload_agent_choices(decisions: list):
+    """Upload agent choices to HuggingFace dataset"""
+    df = pd.DataFrame(decisions)
+    dataset = Dataset.from_pandas(df)
+    try:
+        # Try to load existing dataset and append
+        existing_dataset = Dataset.from_parquet(f"hf://datasets/{AGENT_CHOICES_REPO}")
+        combined_dataset = existing_dataset.concatenate(dataset)
+        combined_dataset.push_to_hub(AGENT_CHOICES_REPO, private=False)
+    except:
+        # If no existing dataset, create new one
+        dataset.push_to_hub(AGENT_CHOICES_REPO, private=False)
+    print(f"Uploaded {len(decisions)} agent decisions to {AGENT_CHOICES_REPO}")
+def weekly_pipeline():
+    """Main weekly pipeline that runs every Sunday"""
+    print(f"Starting weekly pipeline at {datetime.now()}")
+    try:
+        # 1. Get top 10 questions from Polymarket
+        markets = get_top_polymarket_questions(N_MARKETS)
+        print(f"Retrieved {len(markets)} markets from Polymarket")
+        # 2. Upload to weekly markets dataset
+        upload_weekly_markets(markets)
+        # 3. Run agent decision-making
+        decisions = run_agent_decisions(markets)
+        print(f"Generated {len(decisions)} agent decisions")
+        # 4. Upload agent choices
+        upload_agent_choices(decisions)
+        print("Weekly pipeline completed successfully")
+    except Exception as e:
+        print(f"Weekly pipeline failed: {e}")
+# Set up scheduler to run every Sunday at 8:30 AM
+scheduler = BackgroundScheduler()
+scheduler.add_job(restart_space, "cron", day_of_week="sun", hour=8, minute=0)
+scheduler.add_job(weekly_pipeline, "cron", day_of_week="sun", hour=8, minute=30)
+scheduler.start()
+# Simple Gradio interface for monitoring
+def get_status():
+    """Get current status of the backend"""
+    try:
+        # Check if datasets exist and get their info
+        api = HfApi()
+        weekly_info = "Not available"
+        choices_info = "Not available"
+        try:
+            weekly_dataset = Dataset.from_parquet(
+                f"hf://datasets/{WEEKLY_MARKETS_REPO}"
+            )
+            weekly_info = f"{len(weekly_dataset)} markets"
+        except:
+            pass
+        try:
+            choices_dataset = Dataset.from_parquet(
+                f"hf://datasets/{AGENT_CHOICES_REPO}"
+            )
+            choices_info = f"{len(choices_dataset)} decisions"
+        except:
+            pass
+        return f"""
+        Backend Status (Last updated: {datetime.now()})
+        Weekly Markets Dataset: {weekly_info}
+        Agent Choices Dataset: {choices_info}
+        Next scheduled run: Next Sunday at 8:30 AM UTC
+        """
+    except Exception as e:
+        return f"Error getting status: {e}"
+def manual_run():
+    """Manually trigger the weekly pipeline"""
+    weekly_pipeline()
+    return "Manual pipeline run completed. Check logs for details."
+# Create Gradio interface
+with gr.Blocks(title="PrediBench Backend") as demo:
+    gr.Markdown("# PrediBench Backend Monitor")
+    gr.Markdown(
+        "This backend automatically fetches new Polymarket questions every Sunday and runs agent predictions."
+    )
+    with gr.Row():
+        status_text = gr.Textbox(label="Status", value=get_status(), lines=10)
+        refresh_btn = gr.Button("Refresh Status")
+        refresh_btn.click(get_status, outputs=status_text)
+    with gr.Row():
+        manual_btn = gr.Button("Run Manual Pipeline", variant="primary")
+        manual_output = gr.Textbox(label="Manual Run Output", lines=5)
+        manual_btn.click(manual_run, outputs=manual_output)
+if __name__ == "__main__":
+    print("Starting PrediBench backend...")
+    demo.launch(server_name="0.0.0.0", server_port=7860)

requirements.txt ADDED Viewed

	@@ -0,0 +1,6 @@

+gradio
+datasets
+huggingface_hub
+apscheduler
+python-dotenv
+git+https://github.com/m-ric/predibench-core