Spaces:

mgbam
/

project-asclepius

Sleeping

App Files Community

mgbam committed 20 days ago

Commit

140d9d4

verified ·

1 Parent(s): 51d35a8

Update modules/orchestrator.py

Browse files

Files changed (1) hide show

modules/orchestrator.py +114 -69

modules/orchestrator.py CHANGED Viewed

@@ -1,103 +1,146 @@
 # modules/orchestrator.py
 """
-The main conductor. This module sequences the calls to APIs and the AI model.
-It contains the core application logic for each feature tab, orchestrating
-data fetching, processing, and AI synthesis.
 """
 import asyncio
 import aiohttp
-import ast
 from itertools import chain
 from PIL import Image
-# Import all our tools
-from . import gemini_handler, prompts
 from .api_clients import (
-    umls_client,
     pubmed_client,
     clinicaltrials_client,
     openfda_client,
     rxnorm_client
 )
-# --- Helper function for formatting data for prompts ---
-def _format_data_for_prompt(data: list | dict, source_name: str) -> str:
-    """Converts API result lists/dicts into a clean string for Gemini prompts."""
-    if not data:
-        return f"No data found from {source_name}."
-    report_lines = [f"--- Data from {source_name} ---"]
-    if isinstance(data, list):
-        for item in data:
-            report_lines.append(str(item))
-    elif isinstance(data, dict):
-        for key, value in data.items():
-            report_lines.append(f"{key}: {value}")
-    return "\n".join(report_lines)
-# --- Main Orchestrator for the Symptom Synthesizer ---
 async def run_symptom_synthesis(user_query: str, image_input: Image.Image | None) -> str:
     """The complete, asynchronous pipeline for the Symptom Synthesizer tab."""
     if not user_query:
         return "Please enter a symptom description or a medical question to begin."
-    # 1. Extract concepts with Gemini
-    term_extraction_prompt = prompts.get_term_extraction_prompt(user_query)
-    concepts_str = await gemini_handler.generate_text_response(term_extraction_prompt)
-    try:
-        concepts = ast.literal_eval(concepts_str)
-        if not isinstance(concepts, list) or not concepts:
-            concepts = [user_query] # Fallback
-    except (ValueError, SyntaxError):
-        concepts = [user_query] # Fallback
-    search_query = " OR ".join(concepts)
-    # 2. Gather all evidence concurrently
     async with aiohttp.ClientSession() as session:
         tasks = {
             "pubmed": pubmed_client.search_pubmed(session, search_query, max_results=3),
             "trials": clinicaltrials_client.find_trials(session, search_query, max_results=3),
-            "openfda": asyncio.gather(*(openfda_client.get_adverse_events(session, c, top_n=3) for c in concepts))
         }
         if image_input:
             tasks["vision"] = gemini_handler.analyze_image_with_text(
-                "Analyze this image in a medical context. Describe what you see objectively. Do not diagnose.", image_input
             )
-        results = await asyncio.gather(*tasks.values(), return_exceptions=True)
-        api_data = dict(zip(tasks.keys(), results))
-    # 3. Format all gathered data for the final prompt
-    pubmed_formatted = _format_data_for_prompt(api_data.get('pubmed'), "PubMed")
-    trials_formatted = _format_data_for_prompt(api_data.get('trials'), "ClinicalTrials.gov")
-    # Flatten the list of lists from the OpenFDA gather call
-    fda_results = list(chain.from_iterable(api_data.get('openfda', [])))
-    fda_formatted = _format_data_for_prompt(fda_results, "OpenFDA Adverse Events")
-    vision_formatted = api_data.get('vision', "")
-    if isinstance(vision_formatted, Exception):
-        vision_formatted = "Error analyzing image."
-    # 4. The Grand Synthesis with Gemini
     synthesis_prompt = prompts.get_synthesis_prompt(
         user_query=user_query,
         concepts=concepts,
-        pubmed_data=pubmed_formatted,
-        trials_data=trials_formatted,
-        fda_data=fda_formatted,
-        vision_analysis=vision_formatted
     )
     final_report = await gemini_handler.generate_text_response(synthesis_prompt)
     return f"{prompts.DISCLAIMER}\n\n{final_report}"
-# --- Main Orchestrator for the Drug Interaction Analyzer ---
 async def run_drug_interaction_analysis(drug_list_str: str) -> str:
     """The complete, asynchronous pipeline for the Drug Interaction Analyzer tab."""
     if not drug_list_str:
@@ -107,16 +150,16 @@ async def run_drug_interaction_analysis(drug_list_str: str) -> str:
     if len(drug_names) < 2:
         return "Please enter at least two medications to check for interactions."
-    # 1. Gather all drug data concurrently
     async with aiohttp.ClientSession() as session:
         tasks = {
             "interactions": rxnorm_client.run_interaction_check(drug_names),
             "safety_profiles": asyncio.gather(*(openfda_client.get_safety_profile(session, name) for name in drug_names))
         }
-        results = await asyncio.gather(*tasks.values(), return_exceptions=True)
-        api_data = dict(zip(tasks.keys(), results))
-    # 2. Format data for the final prompt
     interaction_data = api_data.get('interactions', [])
     if isinstance(interaction_data, Exception):
         interaction_data = [{"error": str(interaction_data)}]
@@ -124,20 +167,22 @@ async def run_drug_interaction_analysis(drug_list_str: str) -> str:
     safety_profiles = api_data.get('safety_profiles', [])
     if isinstance(safety_profiles, Exception):
         safety_profiles = [{"error": str(safety_profiles)}]
-    # Combine safety profiles with their drug names
     safety_data_dict = dict(zip(drug_names, safety_profiles))
-    interaction_formatted = _format_data_for_prompt(interaction_data, "RxNorm Interactions")
-    safety_formatted = _format_data_for_prompt(safety_data_dict, "OpenFDA Safety Profiles")
-    # 3. Synthesize the safety report with Gemini
     synthesis_prompt = prompts.get_drug_interaction_synthesis_prompt(
         drug_names=drug_names,
         interaction_data=interaction_formatted,
         safety_data=safety_formatted
     )
     final_report = await gemini_handler.generate_text_response(synthesis_prompt)
     return f"{prompts.DISCLAIMER}\n\n{final_report}"

 # modules/orchestrator.py
 """
+The Central Nervous System of Project Asclepius.
+This module is the master conductor, orchestrating high-performance, asynchronous
+workflows for each of the application's features. It intelligently sequences
+calls to API clients and the Gemini handler to transform user queries into
+comprehensive, synthesized reports.
 """
 import asyncio
 import aiohttp
 from itertools import chain
 from PIL import Image
+# Import all our specialized tools
+from . import gemini_handler, prompts, utils
 from .api_clients import (
     pubmed_client,
     clinicaltrials_client,
     openfda_client,
     rxnorm_client
+    # NOTE: umls_client is not imported here; concept extraction in this module goes through gemini_handler. Add it back if UMLS lookups are needed.
 )
+# --- Internal Helper for Data Formatting ---
+def _format_api_data_for_prompt(api_results: dict) -> dict[str, str]:
+    """
+    Takes the raw dictionary of API results and formats each entry into a
+    clean, readable string suitable for injection into a Gemini prompt.
+    Args:
+        api_results (dict): The dictionary of results from asyncio.gather.
+    Returns:
+        dict[str, str]: A dictionary with the same keys but formatted string values.
+    """
+    formatted_strings = {}
+    # Format PubMed data
+    pubmed_data = api_results.get('pubmed', [])
+    if isinstance(pubmed_data, list) and pubmed_data:
+        lines = [f"- Title: {a.get('title', 'N/A')} (Journal: {a.get('journal', 'N/A')}, URL: {a.get('url')})" for a in pubmed_data]
+        formatted_strings['pubmed'] = "\n".join(lines)
+    else:
+        formatted_strings['pubmed'] = "No relevant review articles were found on PubMed for this query."
+    # Format Clinical Trials data
+    trials_data = api_results.get('trials', [])
+    if isinstance(trials_data, list) and trials_data:
+        lines = [f"- Title: {t.get('title', 'N/A')} (Status: {t.get('status', 'N/A')}, URL: {t.get('url')})" for t in trials_data]
+        formatted_strings['trials'] = "\n".join(lines)
+    else:
+        formatted_strings['trials'] = "No actively recruiting clinical trials were found matching this query."
+    # Format OpenFDA Adverse Events data
+    # This data often comes from multiple queries, so we flatten it.
+    fda_data = api_results.get('openfda', [])
+    if isinstance(fda_data, list):
+        # The result is a list of lists, so we flatten it
+        all_events = list(chain.from_iterable(filter(None, fda_data)))
+        if all_events:
+            lines = [f"- {evt['term']} (Reported {evt['count']} times)" for evt in all_events]
+            formatted_strings['openfda'] = "\n".join(lines)
+        else:
+            formatted_strings['openfda'] = "No specific adverse event data was found for this query."
+    else:
+        formatted_strings['openfda'] = "No specific adverse event data was found for this query."
+    # Format Vision analysis
+    vision_data = api_results.get('vision', "")
+    if isinstance(vision_data, str) and vision_data:
+        formatted_strings['vision'] = vision_data
+    elif isinstance(vision_data, Exception):
+        formatted_strings['vision'] = f"An error occurred during image analysis: {vision_data}"
+    else:
+        formatted_strings['vision'] = ""
+    return formatted_strings
+# --- FEATURE 1: Symptom Synthesizer Pipeline ---
 async def run_symptom_synthesis(user_query: str, image_input: Image.Image | None) -> str:
     """The complete, asynchronous pipeline for the Symptom Synthesizer tab."""
     if not user_query:
         return "Please enter a symptom description or a medical question to begin."
+    # STEP 1: AI-Powered Concept Extraction
+    # Use Gemini to find the core medical terms in the user's natural language query.
+    term_prompt = prompts.get_term_extraction_prompt(user_query)
+    concepts_str = await gemini_handler.generate_text_response(term_prompt)
+    concepts = utils.safe_literal_eval(concepts_str)
+    if not isinstance(concepts, list) or not concepts:
+        concepts = [user_query]  # Fallback to the raw query if parsing fails
+    # Use "OR" for a broader, more inclusive search across APIs
+    search_query = " OR ".join(f'"{c}"' for c in concepts)
+    # STEP 2: Massively Parallel Evidence Gathering
+    # Launch all API calls concurrently for maximum performance.
     async with aiohttp.ClientSession() as session:
+        # Define the portfolio of data we need to collect
         tasks = {
             "pubmed": pubmed_client.search_pubmed(session, search_query, max_results=3),
             "trials": clinicaltrials_client.find_trials(session, search_query, max_results=3),
+            "openfda": asyncio.gather(*(openfda_client.get_adverse_events(session, c, top_n=3) for c in concepts)),
         }
+        # If an image is provided, add the vision analysis to our task portfolio
         if image_input:
             tasks["vision"] = gemini_handler.analyze_image_with_text(
+                "In the context of the user query, analyze this image objectively. Describe visual features like color, shape, texture, and patterns. Do not diagnose or offer medical advice.", image_input
             )
+        # Execute all tasks and wait for them all to complete
+        raw_results = await asyncio.gather(*tasks.values(), return_exceptions=True)
+        api_data = dict(zip(tasks.keys(), raw_results))
+    # STEP 3: Data Formatting
+    # Convert the raw JSON/list results into clean, prompt-ready strings.
+    formatted_data = _format_api_data_for_prompt(api_data)
+    # STEP 4: The Grand Synthesis
+    # Feed all the structured, evidence-based data into Gemini for the final report generation.
     synthesis_prompt = prompts.get_synthesis_prompt(
         user_query=user_query,
         concepts=concepts,
+        pubmed_data=formatted_data['pubmed'],
+        trials_data=formatted_data['trials'],
+        fda_data=formatted_data['openfda'],
+        vision_analysis=formatted_data['vision']
     )
     final_report = await gemini_handler.generate_text_response(synthesis_prompt)
+    # STEP 5: Final Delivery
+    # Prepend the mandatory disclaimer to the AI-generated report.
     return f"{prompts.DISCLAIMER}\n\n{final_report}"
+# --- FEATURE 2: Drug Interaction & Safety Analyzer Pipeline ---
 async def run_drug_interaction_analysis(drug_list_str: str) -> str:
     """The complete, asynchronous pipeline for the Drug Interaction Analyzer tab."""
     if not drug_list_str:
     if len(drug_names) < 2:
         return "Please enter at least two medications to check for interactions."
+    # STEP 1: Concurrent Drug Data Gathering
     async with aiohttp.ClientSession() as session:
         tasks = {
             "interactions": rxnorm_client.run_interaction_check(drug_names),
             "safety_profiles": asyncio.gather(*(openfda_client.get_safety_profile(session, name) for name in drug_names))
         }
+        raw_results = await asyncio.gather(*tasks.values(), return_exceptions=True)
+        api_data = dict(zip(tasks.keys(), raw_results))
+    # STEP 2: Data Formatting for AI Synthesis
     interaction_data = api_data.get('interactions', [])
     if isinstance(interaction_data, Exception):
         interaction_data = [{"error": str(interaction_data)}]
     safety_profiles = api_data.get('safety_profiles', [])
     if isinstance(safety_profiles, Exception):
         safety_profiles = [{"error": str(safety_profiles)}]
+    # Combine safety profiles with their drug names for clarity in the prompt
     safety_data_dict = dict(zip(drug_names, safety_profiles))
+    # Format the complex data into clean strings
+    interaction_formatted = utils.format_list_as_markdown([str(i) for i in interaction_data]) if interaction_data else "No interactions found."
+    safety_formatted = "\n".join([f"Profile for {drug}: {profile}" for drug, profile in safety_data_dict.items()])
+    # STEP 3: AI-Powered Safety Briefing
     synthesis_prompt = prompts.get_drug_interaction_synthesis_prompt(
         drug_names=drug_names,
         interaction_data=interaction_formatted,
         safety_data=safety_formatted
     )
     final_report = await gemini_handler.generate_text_response(synthesis_prompt)
+    # STEP 4: Final Delivery
     return f"{prompts.DISCLAIMER}\n\n{final_report}"