Spaces:

GuglielmoTor
/

LinkedinMonitor

Running

App Files Files Community

GuglielmoTor committed 18 days ago

Commit

0cfca76

verified ·

1 Parent(s): 5b325ca

Update run_agentic_pipeline.py

Browse files

Files changed (1) hide show

run_agentic_pipeline.py +129 -77

run_agentic_pipeline.py CHANGED Viewed

@@ -1,106 +1,158 @@
-# run_agentic_pipeline.py
-"""
-This module is responsible for loading and displaying pre-computed AI analysis
-results (reports and OKRs) that have been fetched from Bubble.io. It does not
-perform any new analysis.
-"""
-import logging
 import gradio as gr
-# UI formatting and data reconstruction functions are still needed
 try:
     from ui.insights_ui_generator import (
-        format_report_to_markdown,
         extract_key_results_for_selection,
         format_single_okr_for_display
     )
-    from services.report_data_handler import fetch_and_reconstruct_data_from_bubble
     AGENTIC_MODULES_LOADED = True
 except ImportError as e:
     logging.error(f"Could not import agentic pipeline display modules: {e}. Tabs 3 and 4 will be disabled.")
     AGENTIC_MODULES_LOADED = False
-    # Define placeholder functions if imports fail
-    def format_report_to_markdown(report_string): return "Agentic modules not loaded. Report unavailable."
     def extract_key_results_for_selection(okrs_dict): return []
     def format_single_okr_for_display(okr_data, **kwargs): return "Agentic modules not loaded. OKR display unavailable."
-    def fetch_and_reconstruct_data_from_bubble(df): return None
def load_and_display_agentic_results(current_token_state, orchestration_raw_results_st, selected_key_result_ids_st, key_results_for_selection_st):
    """
    Build the Gradio updates that show previously computed agentic results.

    Reads the 'bubble_agentic_analysis_data' DataFrame from the application
    state, reconstructs the report and OKRs from it, and formats both for the
    UI. No new analysis is performed here.

    Returns a 7-tuple, in this order: report markdown update, key-results
    checkbox-group update, OKR detail markdown update, reconstructed data
    (or None), selected key-result IDs (always reset to []), the list of
    selectable key results, and a status string.
    """
    logging.info("Loading and displaying pre-computed agentic results from state.")

    # Values returned when there is nothing to show; the error paths below
    # reuse them and override only the slots that differ.
    placeholders = (
        gr.update(value="Nessun dato di analisi trovato..."),
        gr.update(choices=[], value=[], interactive=False),
        gr.update(value="Nessun OKR trovato..."),
        None,
        [],
        [],
        "Stato: In attesa di dati",
    )

    if not AGENTIC_MODULES_LOADED:
        logging.warning("Agentic display modules not loaded. Cannot display results.")
        return (*placeholders[:-1], "Errore: Moduli AI non caricati.")

    analysis_df = current_token_state.get('bubble_agentic_analysis_data')
    if analysis_df is None or analysis_df.empty:
        logging.warning("No agentic analysis data found in the application state.")
        return placeholders

    rebuilt = fetch_and_reconstruct_data_from_bubble(analysis_df)
    if not rebuilt:
        logging.warning("Could not reconstruct agentic data from the fetched DataFrame.")
        return (
            gr.update(value="I dati di analisi esistenti non sono nel formato corretto."),
            placeholders[1],
            gr.update(value="Impossibile visualizzare gli OKR."),
            *placeholders[3:-1],
            "Stato: Errore formato dati",
        )

    # Report tab.
    report_text = rebuilt.get('report_str', "Nessun report di analisi trovato nei dati.")
    okr_payload = rebuilt.get('actionable_okrs')
    report_update = gr.update(value=format_report_to_markdown(report_text))

    # OKR tab: only populated when the payload carries a list under "okrs".
    has_okr_list = bool(okr_payload) and isinstance(okr_payload.get("okrs"), list)
    if not has_okr_list:
        selectable_krs = []
        checkbox_update = gr.update(choices=[], value=[], interactive=False)
        okr_detail_update = gr.update(value="Nessun OKR trovato nei dati di analisi caricati.")
    else:
        selectable_krs = extract_key_results_for_selection(okr_payload)
        checkbox_choices = [
            (entry['kr_description'], entry['unique_kr_id'])
            for entry in selectable_krs
        ]
        checkbox_update = gr.update(choices=checkbox_choices, value=[], interactive=True)
        rendered_okrs = [
            format_single_okr_for_display(okr, accepted_kr_indices=None, okr_main_index=position)
            for position, okr in enumerate(okr_payload["okrs"])
        ]
        okr_detail_update = gr.update(value="\n\n---\n\n".join(rendered_okrs))

    return (
        report_update,
        checkbox_update,
        okr_detail_update,
        rebuilt,           # full reconstructed data goes back into the state
        [],                # selected key-result IDs are reset
        selectable_krs,    # every key result available for selection
        "Stato: Dati di analisi caricati correttamente da Bubble",
    )

 import gradio as gr
+import pandas as pd
+import json
+import logging
+from typing import Dict, Any, List, Optional
+# Assuming these functions are in ui.insights_ui_generator
+# Make sure to have this file updated with the new `format_report_for_display` function
 try:
     from ui.insights_ui_generator import (
+        format_report_for_display,
         extract_key_results_for_selection,
         format_single_okr_for_display
     )
     AGENTIC_MODULES_LOADED = True
 except ImportError as e:
     logging.error(f"Could not import agentic pipeline display modules: {e}. Tabs 3 and 4 will be disabled.")
     AGENTIC_MODULES_LOADED = False
+    def format_report_for_display(report_data): return "Agentic modules not loaded. Report unavailable."
     def extract_key_results_for_selection(okrs_dict): return []
     def format_single_okr_for_display(okr_data, **kwargs): return "Agentic modules not loaded. OKR display unavailable."
+logger = logging.getLogger(__name__)
def _format_created_date(value: Any, fmt: str) -> str:
    """Format a timestamp with *fmt*, or return 'unknown date' for NaT/missing values."""
    return "unknown date" if pd.isna(value) else value.strftime(fmt)


def _report_choice_label(row: Any) -> str:
    """Build the dropdown label '<report type> - <created timestamp>' for one report row."""
    report_type = row.get('report_type', 'Report')
    # A NaN/None cell would otherwise render literally as "nan"/"None".
    if pd.api.types.is_scalar(report_type) and pd.isna(report_type):
        report_type = 'Report'
    return f"{report_type} - {_format_created_date(row['Created Date'], '%Y-%m-%d %H:%M')}"


def _parse_orchestration_results(raw_value: Any, report_id: Any) -> Dict[str, Any]:
    """Return a report's 'orchestration_results' cell as a dict, or {} when unusable."""
    if isinstance(raw_value, dict):
        # Already decoded upstream; nothing to parse.
        return raw_value
    if not isinstance(raw_value, str):
        # Covers a missing column, None/NaN and any other non-text cell.
        return {}
    try:
        parsed = json.loads(raw_value)
    except json.JSONDecodeError:
        logger.error("Failed to parse 'orchestration_results' JSON for report ID %s", report_id)
        return {}
    # Valid JSON that is not an object (list, null, number) cannot hold OKRs.
    return parsed if isinstance(parsed, dict) else {}


def load_and_display_agentic_results(
    token_state: dict,
    orchestration_raw_results_st: Optional[dict],
    selected_key_result_ids_st: List[str],
    key_results_for_selection_st: List[dict]
) -> tuple:
    """
    Load pre-computed agentic results from the state and prepare the UI updates.

    Populates the report-library dropdown with every report found in the
    'bubble_agentic_analysis_data' DataFrame (newest first) and displays the
    latest report together with the OKRs stored in its 'orchestration_results'
    column. The DataFrame held in ``token_state`` is not modified.

    Args:
        token_state: State dictionary holding the 'bubble_agentic_analysis_data'
            DataFrame. ``None`` is treated like an empty state.
        orchestration_raw_results_st: Current raw-results state (not read here).
        selected_key_result_ids_st: Current selected key-result IDs (not read here).
        key_results_for_selection_st: Current selectable key results (not read here).

    Returns:
        An 8-tuple whose order must match the output components it feeds:
            1. agentic_report_display_md
            2. report_selector_dd
            3. key_results_cbg
            4. okr_detail_display_md
            5. orchestration_raw_results_st
            6. selected_key_result_ids_st
            7. key_results_for_selection_st
            8. agentic_pipeline_status_md

    Any exception raised while processing the DataFrame is logged and turned
    into an error message in slots 1 and 8 instead of propagating.
    """
    initial_updates = (
        "No agentic analysis data found in Bubble.",
        gr.update(choices=[], value=None, interactive=False),
        gr.update(choices=[], value=[], interactive=False),
        "No OKRs to display.",
        None,
        [],
        [],
        "Status: No agentic analysis data found."
    )

    if not AGENTIC_MODULES_LOADED:
        error_updates = list(initial_updates)
        error_updates[7] = "Status: Critical module import error."
        return tuple(error_updates)

    # Tolerate an uninitialised state instead of raising AttributeError.
    agentic_df = (token_state or {}).get("bubble_agentic_analysis_data")
    if agentic_df is None or agentic_df.empty:
        logger.warning("Agentic analysis DataFrame is missing or empty in the state.")
        return initial_updates

    try:
        # --- 1. Prepare Report Library ---
        if 'Created Date' not in agentic_df.columns or '_id' not in agentic_df.columns:
            raise KeyError("Required columns ('Created Date', '_id') not found in agentic data.")

        # Work on a copy: the original frame lives in shared application state
        # and must not be rewritten as a side effect of rendering.
        reports_df = agentic_df.copy()
        # Unparseable dates become NaT (sorted last) rather than aborting the load.
        reports_df['Created Date'] = pd.to_datetime(reports_df['Created Date'], errors='coerce')
        reports_df = reports_df.sort_values(by='Created Date', ascending=False).reset_index(drop=True)

        # Dropdown choices as (display name, unique ID) pairs.
        report_choices = [
            (_report_choice_label(row), row['_id'])
            for _, row in reports_df.iterrows()
        ]

        # --- 2. Load and Display the Latest Report by Default ---
        latest_report_series = reports_df.iloc[0]
        latest_report_id = latest_report_series['_id']
        report_display_md = format_report_for_display(latest_report_series)
        report_selector_update = gr.update(choices=report_choices, value=latest_report_id, interactive=True)

        # --- 3. Load and Prepare OKRs from the Latest Report ---
        okr_details_md = "No OKRs found in the latest report."
        key_results_cbg_update = gr.update(choices=[], value=[], interactive=False)
        all_krs_state = []

        # Assumption: the full JSON from the agent is stored in 'orchestration_results'.
        raw_results_state = _parse_orchestration_results(
            latest_report_series.get('orchestration_results'), latest_report_id
        )

        actionable_okrs_dict = raw_results_state.get("actionable_okrs")
        if isinstance(actionable_okrs_dict, dict) and actionable_okrs_dict:
            all_krs_state = extract_key_results_for_selection(actionable_okrs_dict) or []
            if all_krs_state:
                kr_choices = [(kr['kr_description'], kr['unique_kr_id']) for kr in all_krs_state]
                key_results_cbg_update = gr.update(choices=kr_choices, value=[], interactive=True)

                # Format all OKRs for the initial display.
                okrs_list = actionable_okrs_dict.get("okrs") or []
                output_md_parts = [
                    format_single_okr_for_display(okr_data, okr_main_index=okr_idx)
                    for okr_idx, okr_data in enumerate(okrs_list)
                ]
                if output_md_parts:
                    okr_details_md = "\n\n---\n\n".join(output_md_parts)

        latest_date_text = _format_created_date(latest_report_series['Created Date'], '%Y-%m-%d')
        status_update = f"Status: Loaded {len(reports_df)} reports. Displaying the latest from {latest_date_text}."

        return (
            report_display_md,
            report_selector_update,
            key_results_cbg_update,
            okr_details_md,
            raw_results_state,
            [],  # Reset selected KRs
            all_krs_state,
            status_update
        )

    except Exception as e:
        # UI boundary: surface the failure in the interface instead of crashing the app.
        logger.exception("Failed to process and display agentic results: %s", e)
        error_updates = list(initial_updates)
        error_updates[0] = f"An error occurred while loading reports: {e}"
        error_updates[7] = f"Status: Error - {e}"
        return tuple(error_updates)