Update app.py via AI Editor
app.py
CHANGED
@@ -16,6 +16,7 @@ import logging
 import uuid
 import xlsxwriter # Needed for Excel export engine
 import threading # For multi-threading
+import time # For progress indicator
 
 # --- Logging Configuration ---
 logging.basicConfig(level=logging.INFO, format='%(asctime)s - %(levelname)s - %(message)s')
@@ -75,7 +76,7 @@ uploaded_pink_content = {}
 uploaded_red_content = {}
 uploaded_gold_content = {}
 
-# {session_id: {'doc': content, 'type': doc_type}} - Store the currently displayed document
+# {session_id: {'doc': content, 'type': doc_type, 'format': format}} - Store the currently displayed document, its type, and format for download/chat per session
 current_display_document = {}
 
 # --- Document Types ---
@@ -96,7 +97,7 @@ app.layout = dbc.Container(fluid=True, className="dbc", children=[
 dcc.Store(id='session-id', storage_type='session'), # Store for unique session ID
 # Title Row
 dbc.Row(
-dbc.Col(html.H1("Proposal AI Assistant", className="text-center my-4"), width=12)
+dbc.Col(html.H1("Proposal AI Assistant", className="text-center my-4"), width=12)
 ),
 
 # Progress Indicator Row
@@ -118,7 +119,7 @@ app.layout = dbc.Container(fluid=True, className="dbc", children=[
 
 # Main Content Row
 dbc.Row([
-# Left Column (Nav/Upload) -
+# Left Column (Nav/Upload) - lg=4 (approx 33%)
 dbc.Col(
 dbc.Card(
 dbc.CardBody([
@@ -151,14 +152,16 @@ app.layout = dbc.Container(fluid=True, className="dbc", children=[
 ) for doc_type in document_types.keys()]
 ])
 )
-])
-
-
+]),
+# color="light", # Let CSS handle background
+className="h-100 left-nav-card", # Add custom class for CSS targeting
+),
+width=12, lg=4, # Full width on small, 4/12 on large
 className="mb-3 mb-lg-0",
 style={'paddingRight': '15px'} # Add padding between columns
 ),
 
-# Right Column (Status/Preview/Controls/Chat) -
+# Right Column (Status/Preview/Controls/Chat) - lg=8 (approx 67%)
 dbc.Col(
 dbc.Card(
 dbc.CardBody([
@@ -194,9 +197,11 @@ app.layout = dbc.Container(fluid=True, className="dbc", children=[
 )
 ]), className="mb-3"
 )
-])
-
-
+]),
+# color="white", # Let CSS handle background
+className="h-100 right-nav-card", # Add custom class for CSS targeting
+),
+width=12, lg=8, # Full width on small, 8/12 on large
 style={'paddingLeft': '15px'} # Add padding between columns
 )
 ])
@@ -214,6 +219,36 @@ def get_session_id(session_id_value=None):
         logging.info(f"Generated new session ID: {new_id}")
         return new_id
 
+def parse_generated_content(content_text):
+    """Attempts to parse AI-generated content into a DataFrame if it looks like a table."""
+    try:
+        # Simple check: does it contain multiple lines and pipe characters?
+        if content_text and '\n' in content_text and '|' in content_text:
+            # Try parsing as Markdown-like table (skip lines that don't fit)
+            lines = [line.strip() for line in content_text.strip().split('\n')]
+            # Remove separator lines like |---|---|
+            lines = [line for line in lines if not all(c in '-| ' for c in line)]
+            if len(lines) > 1:
+                # Use the first line as header, split by '|'
+                header = [h.strip() for h in lines[0].strip('|').split('|')]
+                data_rows = []
+                for line in lines[1:]:
+                    values = [v.strip() for v in line.strip('|').split('|')]
+                    if len(values) == len(header): # Ensure matching column count
+                        data_rows.append(values)
+                    else:
+                        logging.warning(f"Skipping row due to mismatched columns: {line}")
+
+                if data_rows:
+                    df = pd.DataFrame(data_rows, columns=header)
+                    logging.info("Successfully parsed generated content as DataFrame.")
+                    return df
+    except Exception as e:
+        logging.warning(f"Could not parse content into DataFrame: {e}. Treating as plain text.")
+    # If parsing fails or it doesn't look like a table, return None
+    logging.info("Content does not appear to be a table or parsing failed. Treating as plain text.")
+    return None
+
 def process_document(contents, filename):
     """Processes uploaded file content (PDF or DOCX) and returns text, or None and error message."""
     if contents is None:
@@ -256,44 +291,56 @@ def process_document(contents, filename):
         logging.error(f"Error processing document {filename}: {e}", exc_info=True)
         return None, f"Error processing file {filename}: {str(e)}"
 
-def get_combined_uploaded_text(session_id):
-    """Combines text content of
+def get_combined_uploaded_text(session_id, file_dict):
+    """Combines text content of files in the provided dictionary for a session."""
     with data_lock:
-        session_files =
+        session_files = file_dict.get(session_id, {})
         if not session_files:
             return ""
-
+        # Combine content, adding filenames for context if multiple files
+        if len(session_files) > 1:
+            return "\n\n--- FILE BREAK ---\n\n".join(
+                f"**File: {fname}**\n\n{content}" for fname, content in session_files.items()
+            )
+        else:
+            return next(iter(session_files.values()), "")
 
-def generate_ai_document(session_id, doc_type, input_docs, context_docs=None):
-    """Generates document using Gemini AI. Updates current_display for the session."""
-    global current_display_document # Modifying global state
 
+def generate_ai_document(session_id, doc_type, input_docs, context_docs=None):
+    """Generates document using Gemini AI. Returns generated content and format ('text' or 'dataframe')."""
     if not model:
         logging.error(f"[{session_id}] Gemini AI model not initialized.")
-        return "Error: AI Model not configured. Please check API Key."
+        return "Error: AI Model not configured. Please check API Key.", 'text'
     if not input_docs or not any(doc.strip() for doc in input_docs if doc):
        logging.warning(f"[{session_id}] generate_ai_document called for {doc_type} with no valid input documents.")
-        return f"Error: Missing required input document(s) for {doc_type} generation."
+        return f"Error: Missing required input document(s) for {doc_type} generation.", 'text'
 
     combined_input = "\n\n---\n\n".join(filter(None, input_docs))
     combined_context = "\n\n---\n\n".join(filter(None, context_docs)) if context_docs else ""
 
-    #
+    # Define expected output format based on doc_type
+    is_spreadsheet_type = doc_type in ["Shred", "Pink Review", "Red Review", "Gold Review", "LOE", "Virtual Board"]
+    output_format_instruction = """**Output Format:** Structure the output as a clear, parseable Markdown table. Use '|' as the column delimiter. Define meaningful column headers relevant to the task (e.g., PWS_Section, Requirement, Action_Verb for Shred; Section, Requirement, Compliance_Status, Finding, Recommendation for Reviews; Section, Task, Estimated_Hours, Resource_Type for LOE). Ensure each row corresponds to a distinct item (e.g., requirement, finding, task).""" if is_spreadsheet_type else """**Output Format:** Write professional, compelling proposal prose. Use clear paragraphs and standard formatting. Address all requirements logically. Avoid tables unless explicitly part of the proposal structure."""
+
     prompt = f"""**Objective:** Generate the '{doc_type}' document.
-**Your Role:** Act as an expert proposal writer/analyst.
+**Your Role:** Act as an expert proposal writer/analyst specialized in government contracting.
 **Core Instructions:**
-1. **Adhere Strictly to the Task:** Generate *only* the content for the '{doc_type}'. Do not add introductions, summaries, or conversational filler unless it's part of the requested document format itself.
-2. **Follow Format Guidelines:**
-
-* **
-
-* **
-* **
+1. **Adhere Strictly to the Task:** Generate *only* the content for the '{doc_type}'. Do not add introductions, summaries, explanations, or conversational filler unless it's part of the requested document format itself (e.g., an executive summary within a proposal draft).
+2. **Follow Format Guidelines:** {output_format_instruction}
+3. **Content Requirements:**
+    * **Shred:** Identify requirements (explicit and implied), action verbs (shall, will, must, provide, perform, etc.), and PWS section references.
+    * **Proposal Sections (Pink, Red, Gold):** Write compliant and compelling content. Directly address requirements from the Context Document(s). Detail the 'how' (approach, methodology, tools). Incorporate win themes, strengths, and discriminators. Substantiate claims. Use active voice ("Our team will..."). Ensure compliance with evaluation criteria (e.g., Section L/M). Clearly map responses back to PWS requirements.
+    * **Reviews (Pink, Red, Gold):** Evaluate the submitted draft against the requirements (Shred/PWS) and previous review findings (if applicable). Identify compliance issues, gaps, weaknesses, and areas for improvement. Provide actionable recommendations. Be specific and reference relevant sections.
+    * **LOE:** Estimate the Level of Effort (hours, resource types) required to fulfill each major task or requirement identified in the Shred/PWS. Justify estimates briefly if necessary.
+    * **Virtual Board:** Simulate a source selection evaluation. Assess the final proposal against the PWS/Shred and evaluation criteria (Sec L/M). Assign strengths, weaknesses, deficiencies, risks. Provide a summary evaluation.
+4. **Utilize Provided Documents:**
+    * **Context Document(s):** These provide the baseline or reference material (e.g., Shredded Requirements, PWS Section L/M, Previous Review Findings). Refer to them diligently.
+    * **Primary Input Document(s):** This is the main subject of the task (e.g., the PWS text to be Shredded, the Pink draft to be Reviewed, the Red Review findings to incorporate into the Gold draft). Analyze and process this document according to the task.
 **Provided Documents:**
-**Context Document(s)
+**Context Document(s):**
 ```text
 {combined_context if combined_context else "N/A"}
 ```
-**Primary Input Document(s)
+**Primary Input Document(s):**
 ```text
 {combined_input}