Spaces:
Running
Running
Update features/insight_and_tasks/agents/task_extraction_agent.py
Browse files
features/insight_and_tasks/agents/task_extraction_agent.py
CHANGED
@@ -1,68 +1,63 @@
|
|
1 |
# agents/task_extraction_agent.py
|
2 |
-
|
3 |
import logging
|
4 |
-
import json
|
5 |
from typing import Optional
|
6 |
-
from datetime import datetime, date
|
|
|
7 |
from google.adk.agents import LlmAgent
|
8 |
-
from google.adk.runners import InMemoryRunner
|
9 |
-
from google.genai import types as genai_types
|
10 |
|
11 |
# Project-specific imports
|
12 |
from features.insight_and_tasks.data_models.tasks import (
|
13 |
-
TaskExtractionOutput,
|
14 |
-
OKR,
|
15 |
-
KeyResult,
|
16 |
-
Task,
|
17 |
-
EffortLevel,
|
18 |
-
TimelineCategory,
|
19 |
-
PriorityLevel,
|
20 |
-
TaskType,
|
21 |
-
DataSubject
|
22 |
)
|
23 |
-
from features.insight_and_tasks.utils.retry_mechanism import RetryMechanism
|
24 |
|
25 |
# Configure logger for this module
|
26 |
logger = logging.getLogger(__name__)
|
27 |
|
28 |
-
DEFAULT_AGENT_MODEL = "gemini-2.5-flash-preview-05-20"
|
29 |
|
30 |
class TaskExtractionAgent:
|
31 |
"""
|
32 |
Agent specialized in extracting actionable tasks and OKRs from analysis insights,
|
33 |
with awareness of the current date and quarter.
|
34 |
"""
|
35 |
-
|
36 |
AGENT_NAME = "task_extractor"
|
37 |
AGENT_DESCRIPTION = "Specialist in converting strategic insights into specific, time-aware actionable tasks and OKRs."
|
38 |
|
39 |
def __init__(self, api_key: str, model_name: Optional[str] = None, current_date: Optional[date] = None):
|
40 |
"""
|
41 |
Initializes the TaskExtractionAgent.
|
42 |
-
|
43 |
Args:
|
44 |
api_key: API key (may be used by LlmAgent configuration or future needs).
|
45 |
model_name: Name of the language model to use.
|
46 |
current_date: The current date to use for quarter calculations. Defaults to today.
|
47 |
"""
|
48 |
-
self.api_key = api_key
|
49 |
self.model_name = model_name or DEFAULT_AGENT_MODEL
|
50 |
-
self.current_date = current_date or datetime.utcnow().date()
|
51 |
|
52 |
# LlmAgent is initialized with dynamic instruction and output schema
|
53 |
self.agent = LlmAgent(
|
54 |
name=self.AGENT_NAME,
|
55 |
model=self.model_name,
|
56 |
description=self.AGENT_DESCRIPTION,
|
57 |
-
instruction=self._get_instruction_prompt(),
|
58 |
-
output_schema=TaskExtractionOutput,
|
59 |
-
output_key="extracted_tasks_okrs"
|
60 |
)
|
61 |
-
|
62 |
-
self.retry_mechanism = RetryMechanism()
|
63 |
-
|
64 |
logger.info(f"{self.AGENT_NAME} initialized for Q{self._get_quarter(self.current_date)}, "
|
65 |
-
|
66 |
|
67 |
def _get_quarter(self, d: date) -> int:
|
68 |
"""Calculates the quarter for a given date."""
|
@@ -72,7 +67,6 @@ class TaskExtractionAgent:
|
|
72 |
"""Calculates the number of days remaining in the current quarter from date d."""
|
73 |
current_q = self._get_quarter(d)
|
74 |
year = d.year
|
75 |
-
|
76 |
if current_q == 1:
|
77 |
quarter_end_date = date(year, 3, 31)
|
78 |
elif current_q == 2:
|
@@ -83,26 +77,46 @@ class TaskExtractionAgent:
|
|
83 |
quarter_end_date = date(year, 12, 31)
|
84 |
|
85 |
days_remaining = (quarter_end_date - d).days
|
86 |
-
return max(0, days_remaining)
|
87 |
|
88 |
def _get_instruction_prompt(self) -> str:
|
89 |
"""Generates the dynamic instruction string for the LlmAgent."""
|
90 |
quarter = self._get_quarter(self.current_date)
|
91 |
days_remaining = self._days_until_quarter_end(self.current_date)
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
92 |
|
93 |
return f"""
|
94 |
-
You are a Time-Aware Task Extraction Specialist. Your
|
95 |
-
|
96 |
-
|
97 |
-
|
98 |
-
-
|
99 |
-
-
|
100 |
-
-
|
101 |
-
|
102 |
-
|
103 |
-
|
104 |
-
|
105 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
106 |
{{
|
107 |
"current_quarter_info": "Q{quarter}, {days_remaining} days remaining",
|
108 |
"okrs": [
|
@@ -139,7 +153,6 @@ You MUST return a complete JSON object with this exact structure:
|
|
139 |
"overall_strategic_focus": "Summary of main strategic themes",
|
140 |
"generation_timestamp": "{datetime.utcnow().isoformat()}"
|
141 |
}}
|
142 |
-
```
|
143 |
|
144 |
## CRITICAL REQUIREMENTS:
|
145 |
|
@@ -185,164 +198,44 @@ Given {days_remaining} days left in Q{quarter}:
|
|
185 |
- High: Critical for quarter goals, high impact, urgent
|
186 |
- Medium: Important but not critical, moderate impact
|
187 |
- Low: Nice to have, low impact, can be delayed
|
188 |
-
|
189 |
-
## VALIDATION CHECKLIST:
|
190 |
-
Before submitting your response, verify:
|
191 |
-
□ JSON is valid and complete
|
192 |
-
□ current_quarter_info matches exact format required
|
193 |
-
□ Every OKR has 2-4 key results
|
194 |
-
□ Every key result has 2-5 tasks with ALL required fields
|
195 |
-
□ All enum values match exactly (case-sensitive)
|
196 |
-
□ All tasks have clear connection to analysis in why_proposed
|
197 |
-
□ Target metrics and values are specific and measurable
|
198 |
-
□ Timeline assignments are realistic for remaining quarter days
|
199 |
-
|
200 |
-
## ERROR PREVENTION:
|
201 |
-
- Double-check all field names match the schema exactly
|
202 |
-
- Ensure no null values where fields are required
|
203 |
-
- Verify all enum values are spelled correctly
|
204 |
-
- Make sure every key result has tasks (never empty array)
|
205 |
-
- Confirm JSON syntax is valid
|
206 |
-
|
207 |
-
Your response must be ONLY the JSON object, no additional text or formatting.
|
208 |
-
"""
|
209 |
-
|
210 |
-
def _validate_extracted_data(self, data: dict) -> bool:
|
211 |
-
"""
|
212 |
-
Validates the extracted data structure before creating TaskExtractionOutput.
|
213 |
-
|
214 |
-
Args:
|
215 |
-
data: Dictionary containing extracted data
|
216 |
-
|
217 |
-
Returns:
|
218 |
-
bool: True if data is valid, False otherwise
|
219 |
"""
|
220 |
-
try:
|
221 |
-
# Check required top-level fields
|
222 |
-
if not isinstance(data.get('okrs'), list):
|
223 |
-
logger.error("Missing or invalid 'okrs' field")
|
224 |
-
return False
|
225 |
-
|
226 |
-
if not data.get('current_quarter_info'):
|
227 |
-
logger.error("Missing 'current_quarter_info' field")
|
228 |
-
return False
|
229 |
-
|
230 |
-
# Validate each OKR
|
231 |
-
for i, okr in enumerate(data['okrs']):
|
232 |
-
if not isinstance(okr.get('key_results'), list) or len(okr.get('key_results', [])) == 0:
|
233 |
-
logger.error(f"OKR {i} has empty or missing key_results")
|
234 |
-
return False
|
235 |
-
|
236 |
-
# Validate each key result
|
237 |
-
for j, kr in enumerate(okr['key_results']):
|
238 |
-
if not isinstance(kr.get('tasks'), list) or len(kr.get('tasks', [])) == 0:
|
239 |
-
logger.error(f"OKR {i}, Key Result {j} has empty or missing tasks")
|
240 |
-
return False
|
241 |
-
|
242 |
-
# Validate each task has required fields
|
243 |
-
for k, task in enumerate(kr['tasks']):
|
244 |
-
required_fields = [
|
245 |
-
'task_category', 'task_description', 'objective_deliverable',
|
246 |
-
'effort', 'timeline', 'responsible_party', 'success_criteria_metrics',
|
247 |
-
'priority', 'priority_justification', 'why_proposed', 'task_type'
|
248 |
-
]
|
249 |
-
|
250 |
-
for field in required_fields:
|
251 |
-
if not task.get(field):
|
252 |
-
logger.error(f"Task {k} in OKR {i}, KR {j} missing required field: {field}")
|
253 |
-
return False
|
254 |
-
|
255 |
-
return True
|
256 |
-
|
257 |
-
except Exception as e:
|
258 |
-
logger.error(f"Error validating extracted data: {e}")
|
259 |
-
return False
|
260 |
-
|
261 |
-
def _create_fallback_output(self, analysis_summary: str = "") -> TaskExtractionOutput:
|
262 |
-
"""Creates a fallback output with at least one complete OKR structure."""
|
263 |
-
quarter = self._get_quarter(self.current_date)
|
264 |
-
days_remaining = self._days_until_quarter_end(self.current_date)
|
265 |
-
|
266 |
-
fallback_task = Task(
|
267 |
-
task_category="Analysis Review",
|
268 |
-
task_description="Conduct comprehensive review of LinkedIn analytics insights",
|
269 |
-
objective_deliverable="Complete analysis review report with actionable recommendations",
|
270 |
-
effort=EffortLevel.MEDIUM,
|
271 |
-
timeline=TimelineCategory.SHORT_TERM,
|
272 |
-
responsible_party="Social Media Manager",
|
273 |
-
success_criteria_metrics="Review completed within 1 week, 3+ actionable insights identified",
|
274 |
-
dependencies_prerequisites=None,
|
275 |
-
priority=PriorityLevel.HIGH,
|
276 |
-
priority_justification="Required to understand current performance and identify improvement areas",
|
277 |
-
why_proposed="Based on provided comprehensive analysis requiring strategic review",
|
278 |
-
task_type=TaskType.INITIATIVE,
|
279 |
-
data_subject=DataSubject.GENERAL
|
280 |
-
)
|
281 |
-
|
282 |
-
fallback_key_result = KeyResult(
|
283 |
-
key_result_description="Complete strategic analysis review and identify improvement opportunities",
|
284 |
-
target_metric="Analysis Completion Rate",
|
285 |
-
target_value="100% within 1 week",
|
286 |
-
tasks=[fallback_task]
|
287 |
-
)
|
288 |
-
|
289 |
-
fallback_okr = OKR(
|
290 |
-
objective_description="Establish baseline understanding of current LinkedIn performance",
|
291 |
-
key_results=[fallback_key_result],
|
292 |
-
objective_timeline=TimelineCategory.SHORT_TERM,
|
293 |
-
objective_owner="Social Media Team"
|
294 |
-
)
|
295 |
-
|
296 |
-
return TaskExtractionOutput(
|
297 |
-
current_quarter_info=f"Q{quarter}, {days_remaining} days remaining",
|
298 |
-
okrs=[fallback_okr],
|
299 |
-
overall_strategic_focus=f"Focus on analysis review and strategic planning. {analysis_summary}".strip(),
|
300 |
-
generation_timestamp=datetime.utcnow().isoformat()
|
301 |
-
)
|
302 |
|
303 |
async def extract_tasks(self, comprehensive_analysis: str) -> TaskExtractionOutput:
|
304 |
"""
|
305 |
Extracts time-aware actionable tasks from the comprehensive analysis text.
|
306 |
-
|
307 |
Args:
|
308 |
comprehensive_analysis: The text analysis from which to extract tasks.
|
309 |
-
|
310 |
Returns:
|
311 |
A TaskExtractionOutput Pydantic model instance.
|
312 |
"""
|
313 |
if not comprehensive_analysis or not comprehensive_analysis.strip():
|
314 |
logger.warning("Comprehensive analysis text is empty. Cannot extract tasks.")
|
315 |
-
return
|
|
|
|
|
|
|
|
|
316 |
|
317 |
-
#
|
318 |
-
|
319 |
-
days_remaining = self._days_until_quarter_end(self.current_date)
|
320 |
-
|
321 |
prompt_for_adk_agent = f"""
|
322 |
-
|
323 |
-
|
324 |
-
|
325 |
-
|
326 |
-
Based on the analysis above,
|
327 |
-
|
328 |
-
|
329 |
-
- current_quarter_info must be exactly: "Q{quarter}, {days_remaining} days remaining"
|
330 |
-
- Every OKR must have 2-4 key results
|
331 |
-
- Every key result must have 2-5 tasks
|
332 |
-
- All tasks must include ALL required fields
|
333 |
-
- All enum values must match exactly (case-sensitive)
|
334 |
-
- Response must be ONLY valid JSON, no additional text
|
335 |
-
|
336 |
-
Generate the complete JSON structure now:
|
337 |
-
"""
|
338 |
|
339 |
user_input_content = genai_types.Content(
|
340 |
role="user",
|
341 |
parts=[genai_types.Part(text=prompt_for_adk_agent)]
|
342 |
)
|
343 |
|
344 |
-
# Using InMemoryRunner for LlmAgent
|
345 |
runner = InMemoryRunner(agent=self.agent, app_name=f"{self.AGENT_NAME}Runner")
|
|
|
346 |
user_id = f"system_user_task_extractor_{int(datetime.utcnow().timestamp())}"
|
347 |
|
348 |
session = await runner.session_service.create_session(
|
@@ -351,19 +244,21 @@ Generate the complete JSON structure now:
|
|
351 |
)
|
352 |
|
353 |
extracted_data_dict = None
|
354 |
-
full_response_text_for_debug = ""
|
355 |
|
356 |
try:
|
357 |
logger.info(f"Running TaskExtractionAgent for user_id: {user_id}, session_id: {session.id}")
|
358 |
|
|
|
359 |
run_result = runner.run(
|
360 |
user_id=user_id,
|
361 |
session_id=session.id,
|
362 |
new_message=user_input_content
|
363 |
)
|
364 |
-
|
365 |
-
#
|
366 |
if hasattr(run_result, '__aiter__'):
|
|
|
367 |
async for event in run_result:
|
368 |
if (hasattr(event, 'actions') and event.actions and
|
369 |
hasattr(event.actions, 'state_delta') and
|
@@ -371,15 +266,16 @@ Generate the complete JSON structure now:
|
|
371 |
self.agent.output_key in event.actions.state_delta):
|
372 |
|
373 |
extracted_data_dict = event.actions.state_delta[self.agent.output_key]
|
374 |
-
logger.info("Successfully extracted structured data via LlmAgent state_delta.")
|
375 |
break
|
376 |
-
|
377 |
-
# Capture text for debugging
|
378 |
if hasattr(event, 'content') and event.content and event.content.parts:
|
379 |
for part in event.content.parts:
|
380 |
if hasattr(part, 'text'):
|
381 |
-
|
382 |
else:
|
|
|
383 |
for event in run_result:
|
384 |
if (hasattr(event, 'actions') and event.actions and
|
385 |
hasattr(event.actions, 'state_delta') and
|
@@ -387,70 +283,171 @@ Generate the complete JSON structure now:
|
|
387 |
self.agent.output_key in event.actions.state_delta):
|
388 |
|
389 |
extracted_data_dict = event.actions.state_delta[self.agent.output_key]
|
390 |
-
logger.info("Successfully extracted structured data via LlmAgent state_delta.")
|
391 |
break
|
392 |
-
|
393 |
-
# Capture text for debugging
|
394 |
if hasattr(event, 'content') and event.content and event.content.parts:
|
395 |
for part in event.content.parts:
|
396 |
if hasattr(part, 'text'):
|
397 |
-
|
398 |
|
399 |
-
# If no structured output, try parsing the text response
|
400 |
if not extracted_data_dict and full_response_text_for_debug:
|
401 |
-
logger.
|
402 |
-
|
403 |
-
# Clean the response text
|
404 |
-
cleaned_text = full_response_text_for_debug.strip()
|
405 |
-
if cleaned_text.startswith('```json'):
|
406 |
-
cleaned_text = cleaned_text[7:]
|
407 |
-
if cleaned_text.endswith('```'):
|
408 |
-
cleaned_text = cleaned_text[:-3]
|
409 |
-
|
410 |
-
parsed_json = json.loads(cleaned_text)
|
411 |
-
if self._validate_extracted_data(parsed_json):
|
412 |
-
extracted_data_dict = parsed_json
|
413 |
-
logger.info("Successfully parsed and validated JSON from text response")
|
414 |
-
else:
|
415 |
-
logger.warning("Parsed JSON failed validation")
|
416 |
-
|
417 |
-
except json.JSONDecodeError as je:
|
418 |
-
logger.error(f"Failed to parse JSON from text response: {je}")
|
419 |
-
logger.error(f"Raw response (first 1000 chars): {full_response_text_for_debug[:1000]}")
|
420 |
|
421 |
except Exception as e:
|
422 |
logger.error(f"Error during TaskExtractionAgent execution: {e}", exc_info=True)
|
423 |
finally:
|
424 |
try:
|
425 |
await runner.session_service.delete_session(
|
426 |
-
app_name=f"{self.AGENT_NAME}Runner",
|
427 |
-
user_id=user_id,
|
428 |
-
session_id=session.id
|
429 |
)
|
430 |
except Exception as session_del_e:
|
431 |
logger.error(f"Error deleting task extractor session: {session_del_e}")
|
432 |
|
433 |
-
# Process the extracted data
|
434 |
if extracted_data_dict:
|
435 |
-
|
436 |
-
|
437 |
-
|
438 |
-
|
439 |
-
|
440 |
-
|
441 |
-
|
442 |
-
|
443 |
-
|
444 |
-
|
445 |
-
|
446 |
-
logger.error(f"Extracted data is unexpected type: {type(extracted_data_dict)}")
|
447 |
-
return self._create_fallback_output("Unexpected data type")
|
448 |
-
|
449 |
-
except Exception as pydantic_error:
|
450 |
-
logger.error(f"Error parsing extracted dictionary into TaskExtractionOutput: {pydantic_error}", exc_info=True)
|
451 |
-
logger.error(f"Problematic dictionary data: {extracted_data_dict}")
|
452 |
-
return self._create_fallback_output("Pydantic parsing error")
|
453 |
-
|
454 |
# Fallback if no valid data extracted
|
455 |
-
logger.warning("No valid structured data extracted by TaskExtractionAgent
|
456 |
-
return
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
# agents/task_extraction_agent.py
|
|
|
2 |
import logging
|
|
|
3 |
from typing import Optional
|
4 |
+
from datetime import datetime, date # Ensure date is imported if used for type hints
|
5 |
+
|
6 |
from google.adk.agents import LlmAgent
|
7 |
+
from google.adk.runners import InMemoryRunner # Assuming this is used for direct agent running
|
8 |
+
from google.genai import types as genai_types # For constructing ADK agent inputs
|
9 |
|
10 |
# Project-specific imports
|
11 |
from features.insight_and_tasks.data_models.tasks import (
|
12 |
+
TaskExtractionOutput,
|
13 |
+
OKR,
|
14 |
+
KeyResult,
|
15 |
+
Task,
|
16 |
+
EffortLevel,
|
17 |
+
TimelineCategory,
|
18 |
+
PriorityLevel,
|
19 |
+
TaskType,
|
20 |
+
DataSubject # Ensure all are imported
|
21 |
)
|
22 |
+
from features.insight_and_tasks.utils.retry_mechanism import RetryMechanism # If retries are needed for ADK calls
|
23 |
|
24 |
# Configure logger for this module
|
25 |
logger = logging.getLogger(__name__)
|
26 |
|
27 |
+
DEFAULT_AGENT_MODEL = "gemini-2.5-flash-preview-05-20" # Or your specific model
|
28 |
|
29 |
class TaskExtractionAgent:
|
30 |
"""
|
31 |
Agent specialized in extracting actionable tasks and OKRs from analysis insights,
|
32 |
with awareness of the current date and quarter.
|
33 |
"""
|
|
|
34 |
AGENT_NAME = "task_extractor"
|
35 |
AGENT_DESCRIPTION = "Specialist in converting strategic insights into specific, time-aware actionable tasks and OKRs."
|
36 |
|
37 |
def __init__(self, api_key: str, model_name: Optional[str] = None, current_date: Optional[date] = None):
|
38 |
"""
|
39 |
Initializes the TaskExtractionAgent.
|
|
|
40 |
Args:
|
41 |
api_key: API key (may be used by LlmAgent configuration or future needs).
|
42 |
model_name: Name of the language model to use.
|
43 |
current_date: The current date to use for quarter calculations. Defaults to today.
|
44 |
"""
|
45 |
+
self.api_key = api_key # Store if needed by LlmAgent or other components
|
46 |
self.model_name = model_name or DEFAULT_AGENT_MODEL
|
47 |
+
self.current_date = current_date or datetime.utcnow().date() # Use date object for consistency
|
48 |
|
49 |
# LlmAgent is initialized with dynamic instruction and output schema
|
50 |
self.agent = LlmAgent(
|
51 |
name=self.AGENT_NAME,
|
52 |
model=self.model_name,
|
53 |
description=self.AGENT_DESCRIPTION,
|
54 |
+
instruction=self._get_instruction_prompt(), # Instruction generated dynamically
|
55 |
+
output_schema=TaskExtractionOutput, # Pydantic model for structured output
|
56 |
+
output_key="extracted_tasks_okrs" # Key where LlmAgent stores structured output in state
|
57 |
)
|
58 |
+
self.retry_mechanism = RetryMechanism() # For retrying ADK runner if needed
|
|
|
|
|
59 |
logger.info(f"{self.AGENT_NAME} initialized for Q{self._get_quarter(self.current_date)}, "
|
60 |
+
f"{self._days_until_quarter_end(self.current_date)} days remaining in quarter. Model: {self.model_name}")
|
61 |
|
62 |
def _get_quarter(self, d: date) -> int:
|
63 |
"""Calculates the quarter for a given date."""
|
|
|
67 |
"""Calculates the number of days remaining in the current quarter from date d."""
|
68 |
current_q = self._get_quarter(d)
|
69 |
year = d.year
|
|
|
70 |
if current_q == 1:
|
71 |
quarter_end_date = date(year, 3, 31)
|
72 |
elif current_q == 2:
|
|
|
77 |
quarter_end_date = date(year, 12, 31)
|
78 |
|
79 |
days_remaining = (quarter_end_date - d).days
|
80 |
+
return max(0, days_remaining) # Ensure non-negative
|
81 |
|
82 |
def _get_instruction_prompt(self) -> str:
|
83 |
"""Generates the dynamic instruction string for the LlmAgent."""
|
84 |
quarter = self._get_quarter(self.current_date)
|
85 |
days_remaining = self._days_until_quarter_end(self.current_date)
|
86 |
+
|
87 |
+
# Dynamically include Pydantic model field descriptions for better LLM guidance
|
88 |
+
# This part can be complex if done fully automatically. For now, manually summarizing key fields.
|
89 |
+
task_fields_summary = (
|
90 |
+
"Each Task must include: task_category (e.g., Content Strategy), task_description, "
|
91 |
+
"objective_deliverable, effort (Small, Medium, Large), timeline (Immediate, Short-term, Medium-term, Long-term), "
|
92 |
+
"responsible_party, success_criteria_metrics, dependencies_prerequisites (optional), "
|
93 |
+
"priority (High, Medium, Low) with priority_justification, why_proposed (linking to analysis), "
|
94 |
+
"task_type (initiative or tracking), data_subject (for tracking tasks: follower_stats, posts, mentions, general)."
|
95 |
+
)
|
96 |
|
97 |
return f"""
|
98 |
+
You are a Time-Aware Task Extraction Specialist. Your primary function is to meticulously analyze strategic insights
|
99 |
+
derived from LinkedIn analytics and transform them into a structured set of actionable tasks. These tasks should be
|
100 |
+
organized within an Objectives and Key Results (OKRs) framework.
|
101 |
+
CURRENT CONTEXTUAL INFORMATION (DO NOT CHANGE THIS IN YOUR OUTPUT):
|
102 |
+
- Current Quarter: Q{quarter}
|
103 |
+
- Days remaining in current quarter: {days_remaining}
|
104 |
+
- Today's Date (for context): {self.current_date.isoformat()}
|
105 |
+
YOUR MANDATE:
|
106 |
+
1. Define clear, aspirational Objectives (qualitative goals).
|
107 |
+
2. For each Objective, formulate 2-3 specific, measurable Key Results.
|
108 |
+
3. Under each Key Result, list detailed, actionable Tasks required to achieve it.
|
109 |
+
4. CRITICAL: Each Task MUST strictly adhere to the 'Task' Pydantic model fields. This means providing values for ALL required fields: {task_fields_summary}
|
110 |
+
5. Task Timelines: Must be realistic given the {days_remaining} days left in Q{quarter}. Prioritize actions that can make significant progress or be completed within this timeframe. Use TimelineCategory enum values.
|
111 |
+
6. Task Types: Clearly distinguish between 'initiative' (new actions/projects) and 'tracking' (ongoing monitoring/measurement).
|
112 |
+
7. Data Subjects: For 'tracking' tasks, accurately specify the relevant 'data_subject'. For 'initiative' tasks, this can be 'general' or null if not specific to one data type.
|
113 |
+
8. Rationale ('why_proposed'): This is crucial. Each task's proposal must be explicitly justified by and linked back to specific findings, trends, or recommendations mentioned in the input 'comprehensive_analysis'.
|
114 |
+
9. Priority: Assign a priority (High, Medium, Low) to each task and provide a 'priority_justification'.
|
115 |
+
INPUT: You will receive a 'comprehensive_analysis' text.
|
116 |
+
OUTPUT FORMAT:
|
117 |
+
You MUST return a single JSON object that strictly conforms to the 'TaskExtractionOutput' Pydantic schema.
|
118 |
+
This JSON object will contain:
|
119 |
+
|
120 |
{{
|
121 |
"current_quarter_info": "Q{quarter}, {days_remaining} days remaining",
|
122 |
"okrs": [
|
|
|
153 |
"overall_strategic_focus": "Summary of main strategic themes",
|
154 |
"generation_timestamp": "{datetime.utcnow().isoformat()}"
|
155 |
}}
|
|
|
156 |
|
157 |
## CRITICAL REQUIREMENTS:
|
158 |
|
|
|
198 |
- High: Critical for quarter goals, high impact, urgent
|
199 |
- Medium: Important but not critical, moderate impact
|
200 |
- Low: Nice to have, low impact, can be delayed
|
201 |
+
Focus on quality, actionability, and strict adherence to the output schema.
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
202 |
"""
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
203 |
|
204 |
async def extract_tasks(self, comprehensive_analysis: str) -> TaskExtractionOutput:
|
205 |
"""
|
206 |
Extracts time-aware actionable tasks from the comprehensive analysis text.
|
|
|
207 |
Args:
|
208 |
comprehensive_analysis: The text analysis from which to extract tasks.
|
|
|
209 |
Returns:
|
210 |
A TaskExtractionOutput Pydantic model instance.
|
211 |
"""
|
212 |
if not comprehensive_analysis or not comprehensive_analysis.strip():
|
213 |
logger.warning("Comprehensive analysis text is empty. Cannot extract tasks.")
|
214 |
+
return TaskExtractionOutput(
|
215 |
+
current_quarter_info=f"Q{self._get_quarter(self.current_date)}, {self._days_until_quarter_end(self.current_date)} days remaining",
|
216 |
+
okrs=[],
|
217 |
+
overall_strategic_focus="No analysis provided to extract tasks."
|
218 |
+
)
|
219 |
|
220 |
+
# The LlmAgent's instruction already contains the dynamic date info and output format.
|
221 |
+
# The input to the agent's run method will be the comprehensive_analysis.
|
|
|
|
|
222 |
prompt_for_adk_agent = f"""
|
223 |
+
Comprehensive Analysis for Task Extraction:
|
224 |
+
---
|
225 |
+
{comprehensive_analysis}
|
226 |
+
---
|
227 |
+
Based on the analysis above, and adhering strictly to your primary instructions (especially regarding current quarter context, task field requirements, and JSON output schema 'TaskExtractionOutput'), generate the OKRs and tasks.
|
228 |
+
Ensure the 'current_quarter_info' field in your JSON output is exactly: "Q{self._get_quarter(self.current_date)}, {self._days_until_quarter_end(self.current_date)} days remaining".
|
229 |
+
"""
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
230 |
|
231 |
user_input_content = genai_types.Content(
|
232 |
role="user",
|
233 |
parts=[genai_types.Part(text=prompt_for_adk_agent)]
|
234 |
)
|
235 |
|
236 |
+
# Using InMemoryRunner as per original structure for LlmAgent with output_schema
|
237 |
runner = InMemoryRunner(agent=self.agent, app_name=f"{self.AGENT_NAME}Runner")
|
238 |
+
# Generate a unique user_id for each run to ensure fresh session state if needed.
|
239 |
user_id = f"system_user_task_extractor_{int(datetime.utcnow().timestamp())}"
|
240 |
|
241 |
session = await runner.session_service.create_session(
|
|
|
244 |
)
|
245 |
|
246 |
extracted_data_dict = None
|
247 |
+
full_response_text_for_debug = "" # To capture raw text if parsing fails
|
248 |
|
249 |
try:
|
250 |
logger.info(f"Running TaskExtractionAgent for user_id: {user_id}, session_id: {session.id}")
|
251 |
|
252 |
+
# Fix: Use regular for loop instead of async for, since runner.run() returns a generator
|
253 |
run_result = runner.run(
|
254 |
user_id=user_id,
|
255 |
session_id=session.id,
|
256 |
new_message=user_input_content
|
257 |
)
|
258 |
+
|
259 |
+
# Check if it's an async iterator or regular generator
|
260 |
if hasattr(run_result, '__aiter__'):
|
261 |
+
# It's an async iterator, use async for
|
262 |
async for event in run_result:
|
263 |
if (hasattr(event, 'actions') and event.actions and
|
264 |
hasattr(event.actions, 'state_delta') and
|
|
|
266 |
self.agent.output_key in event.actions.state_delta):
|
267 |
|
268 |
extracted_data_dict = event.actions.state_delta[self.agent.output_key]
|
269 |
+
logger.info(f"Successfully extracted structured data via LlmAgent state_delta.")
|
270 |
break
|
271 |
+
|
272 |
+
# Capture text parts for debugging if direct structured output isn't found first
|
273 |
if hasattr(event, 'content') and event.content and event.content.parts:
|
274 |
for part in event.content.parts:
|
275 |
if hasattr(part, 'text'):
|
276 |
+
full_response_text_for_debug += part.text
|
277 |
else:
|
278 |
+
# It's a regular generator, use regular for loop
|
279 |
for event in run_result:
|
280 |
if (hasattr(event, 'actions') and event.actions and
|
281 |
hasattr(event.actions, 'state_delta') and
|
|
|
283 |
self.agent.output_key in event.actions.state_delta):
|
284 |
|
285 |
extracted_data_dict = event.actions.state_delta[self.agent.output_key]
|
286 |
+
logger.info(f"Successfully extracted structured data via LlmAgent state_delta.")
|
287 |
break
|
288 |
+
|
289 |
+
# Capture text parts for debugging if direct structured output isn't found first
|
290 |
if hasattr(event, 'content') and event.content and event.content.parts:
|
291 |
for part in event.content.parts:
|
292 |
if hasattr(part, 'text'):
|
293 |
+
full_response_text_for_debug += part.text
|
294 |
|
|
|
295 |
if not extracted_data_dict and full_response_text_for_debug:
|
296 |
+
logger.warning("LlmAgent did not produce structured output in state_delta. Raw text response was: %s",
|
297 |
+
full_response_text_for_debug[:500] + "...")
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
298 |
|
299 |
except Exception as e:
|
300 |
logger.error(f"Error during TaskExtractionAgent execution: {e}", exc_info=True)
|
301 |
finally:
|
302 |
try:
|
303 |
await runner.session_service.delete_session(
|
304 |
+
app_name=f"{self.AGENT_NAME}Runner", user_id=user_id, session_id=session.id
|
|
|
|
|
305 |
)
|
306 |
except Exception as session_del_e:
|
307 |
logger.error(f"Error deleting task extractor session: {session_del_e}")
|
308 |
|
|
|
309 |
if extracted_data_dict:
|
310 |
+
if isinstance(extracted_data_dict, TaskExtractionOutput): # Already a Pydantic model
|
311 |
+
return extracted_data_dict
|
312 |
+
elif isinstance(extracted_data_dict, dict): # If it's a dict, parse it
|
313 |
+
try:
|
314 |
+
return TaskExtractionOutput(**extracted_data_dict)
|
315 |
+
except Exception as pydantic_error:
|
316 |
+
logger.error(f"Error parsing extracted dictionary into TaskExtractionOutput: {pydantic_error}", exc_info=True)
|
317 |
+
logger.error(f"Problematic dictionary data: {extracted_data_dict}")
|
318 |
+
else:
|
319 |
+
logger.error(f"Extracted data is not a dictionary or TaskExtractionOutput model: {type(extracted_data_dict)}")
|
320 |
+
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
321 |
# Fallback if no valid data extracted
|
322 |
+
logger.warning("No valid structured data extracted by TaskExtractionAgent.")
|
323 |
+
return TaskExtractionOutput(
|
324 |
+
current_quarter_info=f"Q{self._get_quarter(self.current_date)}, {self._days_until_quarter_end(self.current_date)} days remaining",
|
325 |
+
okrs=[],
|
326 |
+
overall_strategic_focus="Failed to extract tasks or no tasks were identified.",
|
327 |
+
generation_timestamp=datetime.utcnow().isoformat()
|
328 |
+
)
|
329 |
+
|
330 |
+
def update_current_date(self, new_date: date):
|
331 |
+
"""
|
332 |
+
Updates the current date for the agent and re-initializes the LlmAgent
|
333 |
+
to reflect the new date context in its instructions.
|
334 |
+
"""
|
335 |
+
self.current_date = new_date
|
336 |
+
# Re-initialize the LlmAgent with the new instruction based on the new date
|
337 |
+
self.agent = LlmAgent(
|
338 |
+
name=self.AGENT_NAME,
|
339 |
+
model=self.model_name,
|
340 |
+
description=self.AGENT_DESCRIPTION,
|
341 |
+
instruction=self._get_instruction_prompt(), # Get updated instruction
|
342 |
+
output_schema=TaskExtractionOutput,
|
343 |
+
output_key="extracted_tasks_okrs"
|
344 |
+
)
|
345 |
+
logger.info(f"{self.AGENT_NAME} date updated. New context: Q{self._get_quarter(self.current_date)}, "
|
346 |
+
f"{self._days_until_quarter_end(self.current_date)} days remaining.")
|
347 |
+
|
348 |
+
|
349 |
+
if __name__ == '__main__':
    import asyncio
    import os  # fix: os.environ.get is used below but `os` is not imported at module top

    # (Ensure logging_config.py is importable for this standalone example.)
    try:
        from utils.logging_config import setup_logging
        setup_logging()
        logger.info("Logging setup for TaskExtractionAgent test.")
    except ImportError:
        logging.basicConfig(level=logging.INFO, format="%(asctime)s - %(name)s - %(levelname)s - %(message)s")
        logger.warning("logging_config.py not found, using basicConfig for logging.")

    MOCK_API_KEY = os.environ.get("GOOGLE_API_KEY", "test_api_key_task_extractor")  # Use your actual key or env var
    MODEL_NAME = DEFAULT_AGENT_MODEL

    # Example comprehensive analysis text (replace with actual analysis output).
    sample_analysis_text = """
    Overall Summary: Follower growth is steady at 5% MoM. Post engagement is highest for video content
    (avg 8% engagement rate) published on weekdays. However, mentions sentiment dipped in the last month
    (-0.2 avg score) due to complaints about customer service response times.
    Key opportunity: Improve customer service communication and leverage video content more effectively.
    Strategic Recommendation: Launch a 'Customer First' initiative and create a video series showcasing customer success stories.
    """

    # Test with a specific date (mid-Q2 2025) so quarter math is deterministic.
    test_date = date(2025, 4, 15)
    task_agent = TaskExtractionAgent(api_key=MOCK_API_KEY, model_name=MODEL_NAME, current_date=test_date)

    logger.info(f"Task Agent Instruction for test_date {test_date}:\n{task_agent._get_instruction_prompt()[:500]}...")

    async def run_extraction():
        """Run one task-extraction pass, mocking the ADK runner when no real API key is set."""
        global InMemoryRunner  # module-level patch target; declared once, up front

        logger.info("Extracting tasks from sample analysis...")
        # In a real scenario, ensure GOOGLE_API_KEY is set if the LlmAgent makes actual calls.
        # For local tests without real API calls, the runner is monkey-patched below.
        original_runner = None
        patched = False
        if MOCK_API_KEY == "test_api_key_task_extractor":
            logger.warning("Using a mock API key. LlmAgent behavior might be limited or mocked for task extraction.")

            class MockADKRunner:
                """Minimal stand-in for the ADK runner so no real API call is made."""

                def __init__(self, agent, app_name):
                    self.agent = agent

                async def session_service_create_session(self, app_name, user_id):
                    class MockSession:
                        id = "mock_session_id"
                    return MockSession()

                async def run(self, user_id, session_id, new_message):
                    # Simulate the event structure an LlmAgent with output_schema would produce.
                    mock_okr = OKR(
                        objective_description="Improve Customer Satisfaction",
                        key_results=[KeyResult(
                            key_result_description="Reduce negative mentions by 10%",
                            tasks=[Task(
                                task_category="Customer Service",
                                task_description="Respond to all negative mentions within 2 hours.",
                                objective_deliverable="Improved response time.",
                                effort=EffortLevel.MEDIUM,
                                timeline=TimelineCategory.IMMEDIATE,
                                responsible_party="Support Team",
                                success_criteria_metrics="Avg response time < 2hrs.",
                                priority=PriorityLevel.HIGH,
                                priority_justification="Critical for reputation.",
                                why_proposed="Analysis showed dip in sentiment due to slow responses.",
                                task_type=TaskType.INITIATIVE,
                                data_subject=DataSubject.MENTIONS,
                            )],
                        )],
                        objective_timeline=TimelineCategory.SHORT_TERM,
                    )
                    mock_output = TaskExtractionOutput(
                        current_quarter_info=f"Q{task_agent._get_quarter(task_agent.current_date)}, {task_agent._days_until_quarter_end(task_agent.current_date)} days remaining",
                        okrs=[mock_okr],
                        overall_strategic_focus="Focus on customer service improvement.",
                    )

                    class MockEvent:
                        def __init__(self):
                            # .model_dump() for Pydantic v2
                            self.actions = type('Actions', (), {'state_delta': {task_agent.agent.output_key: mock_output.model_dump()}})()

                    yield MockEvent()

                async def session_service_delete_session(self, app_name, user_id, session_id):
                    pass

            # Monkey-patch the module-level InMemoryRunner so extract_tasks uses the mock.
            # NOTE(review): InMemoryRunner may no longer be imported at module top — using
            # globals().get() avoids a NameError either way; confirm against the imports.
            original_runner = globals().get('InMemoryRunner')
            InMemoryRunner = MockADKRunner
            patched = True

        try:
            extracted_okrs_output = await task_agent.extract_tasks(sample_analysis_text)
        finally:
            # Fix: the original restore checked a *local* name against globals() and so
            # never ran; restore unconditionally whenever we actually patched.
            if patched:
                InMemoryRunner = original_runner

        print("\n--- TaskExtractionAgent Results ---")
        if extracted_okrs_output:
            print(f"Current Quarter Info: {extracted_okrs_output.current_quarter_info}")
            print(f"Overall Strategic Focus: {extracted_okrs_output.overall_strategic_focus}")
            print(f"Generated Timestamp: {extracted_okrs_output.generation_timestamp}")
            print("\nOKRs Extracted:")
            # Use .model_dump_json() for Pydantic v2 pretty printing.
            print(extracted_okrs_output.model_dump_json(indent=2))
        else:
            print("No OKRs extracted or an error occurred.")

    # Fix: the original wrapped this call in a second, redundant `if __name__ == '__main__'`.
    asyncio.run(run_extraction())

    # Example of updating the agent's date context (moves it into Q4 2025).
    logger.info("\n--- Updating date for Task Agent ---")
    new_test_date = date(2025, 10, 5)
    task_agent.update_current_date(new_test_date)
    # The instruction within task_agent.agent is now updated; a new call to
    # extract_tasks would use this Q4 context.