Spaces:

MicroHealth
/

proposal-writer

Paused

App Files Files Community

bluenevus committed on Apr 28

Commit

c7006a6

1 Parent(s): 20f1559

Update app.py via AI Editor

Browse files

Files changed (1) hide show

app.py +161 -53

app.py CHANGED Viewed

@@ -11,6 +11,8 @@ import dash_bootstrap_components as dbc
 from dash import html, dcc, Input, Output, State, dash_table, callback_context
 logging.basicConfig(level=logging.INFO)
 ANTHROPIC_KEY = os.environ.get("ANTHROPIC_API_KEY", "")
 import anthropic
 anthropic_client = anthropic.Anthropic(api_key=ANTHROPIC_KEY)
@@ -31,36 +33,52 @@ document_types = {
 }
 def process_document(contents, filename):
-    content_type, content_string = contents.split(',')
-    decoded = base64.b64decode(content_string)
-    if filename.lower().endswith('.docx'):
-        doc = Document(BytesIO(decoded))
-        return "\n".join([p.text for p in doc.paragraphs])
-    elif filename.lower().endswith('.pdf'):
-        pdf = PdfReader(BytesIO(decoded))
-        return "".join(page.extract_text() or "" for page in pdf.pages)
-    else:
-        return f"Unsupported file format: {filename}"
 def call_claude(prompt, max_tokens=2048):
-    res = anthropic_client.messages.create(
-        model=CLAUDE3_SONNET_MODEL,
-        max_tokens=max_tokens,
-        temperature=0.1,
-        system="You are a world class proposal consultant and proposal manager.",
-        messages=[{"role": "user", "content": prompt}]
-    )
-    return res.content[0].text if hasattr(res, "content") else str(res)
 def spreadsheet_to_df(text):
     lines = [l.strip() for l in text.splitlines() if '|' in l]
-    if not lines: return pd.DataFrame()
     header = lines[0].strip('|').split('|')
     data = [l.strip('|').split('|') for l in lines[1:]]
     return pd.DataFrame(data, columns=[h.strip() for h in header])
-def generate_content(document, doc_type):
-    prompt = f"{document_types[doc_type]}\n\nDocument:\n{document}\n\nOutput only one spreadsheet table, use | as column separator."
     response = call_claude(prompt, max_tokens=4096)
     df = spreadsheet_to_df(response)
     return response, df
@@ -104,25 +122,47 @@ def make_textarea(btn_id, placeholder):
         style={'height': '80px', 'marginBottom': '10px', 'width': '100%', 'whiteSpace': 'pre-wrap', 'overflowWrap': 'break-word'}
     )
-def make_tab(tab_id, label):
     return dbc.Card(
         dbc.CardBody([
-            make_textarea(tab_id, f"Instructions for {label} (optional)"),
-            make_upload(tab_id),
-            dbc.Button(f"Generate {label}", id=f'{tab_id}-btn', className="mt-2 btn-primary", n_clicks=0),
-            dcc.Loading(html.Div(id=f'{tab_id}-output'), type="default", parent_style={'justifyContent': 'center'}),
-            dbc.Button(f"Download {label} Report", id=f"{tab_id}-download-btn", className="mt-2 btn-secondary", n_clicks=0),
-            dcc.Download(id=f"{tab_id}-download")
-        ]), className="mb-4"
     )
 tab_cards = {tab["id"]: make_tab(tab["id"], tab["label"]) for tab in main_tabs}
 nav_items = [
     dbc.NavLink(tab["label"], href="#", id=f"nav-{tab['id']}", active=(tab["id"] == "shred")) for tab in main_tabs
 ]
-# Render all tab cards, only one visible at a time
 def all_tabs_div():
     return html.Div(
         [
@@ -173,6 +213,45 @@ def display_tab(*nav_clicks):
             styles.append({"display": "none"})
     return styles
 @app.callback(
     [Output(f'{tab_id}-output', 'children') for tab_id in tab_cards] +
     [Output(f"{tab_id}-download", "data") for tab_id in tab_cards],
@@ -181,14 +260,17 @@ def display_tab(*nav_clicks):
     [State(f'{tab_id}-upload', 'contents') for tab_id in tab_cards] +
     [State(f'{tab_id}-upload', 'filename') for tab_id in tab_cards] +
     [State(f'{tab_id}-instructions', 'value') for tab_id in tab_cards] +
-    [State(f'{tab_id}-output', 'children') for tab_id in tab_cards]
 )
 def handle_all_tabs(*args):
     n = len(tab_cards)
     outputs = [None] * (n * 2)
     ctx = callback_context
-    if not ctx.triggered: return outputs
     trig = ctx.triggered[0]['prop_id']
     for idx, tab_id in enumerate(tab_cards):
         gen_btn = f"{tab_id}-btn.n_clicks"
         dl_btn = f"{tab_id}-download-btn.n_clicks"
@@ -198,31 +280,57 @@ def handle_all_tabs(*args):
         filename_idx = idx + n
         instr_idx = idx + 2 * n
         prev_output_idx = idx + 3 * n
         if trig == gen_btn:
-            upload = args[upload_idx]
-            filename = args[filename_idx]
-            instr = args[instr_idx] or ""
-            doc_type = tab_id.replace('-', ' ').title().replace(' ', '')
-            doc_type = next((k for k in document_types if k.lower().replace(' ', '') == tab_id.replace('-', '')), tab_id.title())
-            if upload and filename:
-                doc = process_document(upload, filename)
-            else:
-                doc = ""
-            if doc or tab_id == "virtual-board":
-                content, df = generate_content(doc, doc_type)
-                if not df.empty:
-                    outputs[out_idx] = dash_table.DataTable(
-                        data=df.to_dict('records'),
-                        columns=[{'name': i, 'id': i} for i in df.columns],
-                        style_table={'overflowX': 'auto'},
-                        style_cell={'textAlign': 'left', 'padding': '5px'},
-                        style_header={'fontWeight': 'bold'}
-                    )
                 else:
-                    outputs[out_idx] = dcc.Markdown(content)
             else:
-                outputs[out_idx] = "Please upload a document to begin."
         elif trig == dl_btn:
             prev_output = args[prev_output_idx]
             if prev_output and hasattr(prev_output, 'props') and 'data' in prev_output.props:

 from dash import html, dcc, Input, Output, State, dash_table, callback_context
 logging.basicConfig(level=logging.INFO)
+logger = logging.getLogger("microhealth-pws")
 ANTHROPIC_KEY = os.environ.get("ANTHROPIC_API_KEY", "")
 import anthropic
 anthropic_client = anthropic.Anthropic(api_key=ANTHROPIC_KEY)
 }
 def process_document(contents, filename):
     """Extract plain text from an uploaded document.

     Args:
         contents: Upload payload of the form ``<header>,<base64 data>``.
         filename: Original file name; its extension selects the parser.

     Returns:
         The extracted text for ``.docx`` and ``.pdf`` files. For any other
         extension an ``"Unsupported file format: ..."`` message is returned,
         and when decoding or parsing fails a ``"Failed to process
         document: ..."`` message is returned instead of raising.
     """
     try:
         _header, payload = contents.split(',')
         decoded = base64.b64decode(payload)
         lowered = filename.lower()
         if lowered.endswith('.docx'):
             doc = Document(BytesIO(decoded))
             return "\n".join(p.text for p in doc.paragraphs)
         if lowered.endswith('.pdf'):
             pdf = PdfReader(BytesIO(decoded))
             # Separate pages with a newline (as the DOCX branch does for
             # paragraphs) so the last word of one page is not glued to the
             # first word of the next.
             return "\n".join(page.extract_text() or "" for page in pdf.pages)
         return f"Unsupported file format: {filename}"
     except Exception as e:
         # Best-effort boundary: callers expect a string, never an exception.
         # logger.exception keeps the traceback that logger.error dropped.
         logger.exception("Error processing document %s", filename)
         return f"Failed to process document: {e}"
 def call_claude(prompt, max_tokens=2048):
     """Send ``prompt`` to the Anthropic Messages API and return the reply text.

     Uses the module-level ``anthropic_client`` and ``CLAUDE3_SONNET_MODEL``.
     Any ``Exception`` raised along the way is logged and converted into an
     ``"Anthropic API error: ..."`` string, which is returned in place of the
     reply.
     """
     try:
         request = {
             "model": CLAUDE3_SONNET_MODEL,
             "max_tokens": max_tokens,
             "temperature": 0.1,
             "system": "You are a world class proposal consultant and proposal manager.",
             "messages": [{"role": "user", "content": prompt}],
         }
         res = anthropic_client.messages.create(**request)
         logger.info("Anthropic API call successful.")
         if hasattr(res, "content"):
             # The reply text is taken from the first content block.
             return res.content[0].text
         return str(res)
     except Exception as e:
         logger.error(f"Anthropic API error: {e}")
         return f"Anthropic API error: {e}"
 def _split_table_row(line):
     """Split one pipe-delimited line into whitespace-stripped cells."""
     line = line.strip()
     # Remove at most one framing pipe per side so empty edge cells survive.
     if line.startswith('|'):
         line = line[1:]
     if line.endswith('|'):
         line = line[:-1]
     return [cell.strip() for cell in line.split('|')]


 def _is_delimiter_row(cells):
     """Return True for a markdown header delimiter row such as ``---|:--:``."""
     return all(
         cell and '-' in cell and set(cell) <= set('-:')
         for cell in cells
     )


 def spreadsheet_to_df(text):
     """Parse a pipe-separated table out of ``text`` into a DataFrame.

     Only lines containing ``|`` are considered. The first such line is the
     header; the remaining ones are data rows.

     Args:
         text: Free-form text that may contain a ``|``-delimited table.
             ``None`` is treated like an empty string.

     Returns:
         A ``pandas.DataFrame`` of strings, or an empty DataFrame when no
         line contains ``|``.
     """
     rows = [_split_table_row(l) for l in (text or "").splitlines() if '|' in l]
     if not rows:
         return pd.DataFrame()
     header, body = rows[0], rows[1:]
     # A markdown table puts its ``---|---`` delimiter right after the header;
     # it is layout, not data.
     if body and _is_delimiter_row(body[0]):
         body = body[1:]
     width = len(header)
     data = []
     for row in body:
         if len(row) > width:
             # Extra pipes most likely belonged to the last cell's text, so
             # fold the overflow back into it instead of dropping it.
             row = row[:width - 1] + ['|'.join(row[width - 1:])]
         elif len(row) < width:
             # Pad short rows; pandas raises ValueError on ragged input.
             row = row + [''] * (width - len(row))
         data.append(row)
     return pd.DataFrame(data, columns=header)
+def generate_content(document, doc_type, instructions=""):
+    prompt = f"{document_types[doc_type]}\n\n"
+    if instructions:
+        prompt += f"Additional Instructions:\n{instructions}\n\n"
+    prompt += f"Document:\n{document}\n\nOutput only one spreadsheet table, use | as column separator."
+    logger.info(f"Generating content for {doc_type} with prompt length {len(prompt)}")
     response = call_claude(prompt, max_tokens=4096)
     df = spreadsheet_to_df(response)
     return response, df
         style={'height': '80px', 'marginBottom': '10px', 'width': '100%', 'whiteSpace': 'pre-wrap', 'overflowWrap': 'break-word'}
     )
+def make_shred_doc_preview():
     return dbc.Card(
         dbc.CardBody([
+            html.Div(id="shred-upload-preview", style={"whiteSpace": "pre-wrap", "overflowWrap": "break-word"}),
+            dbc.Button("Delete Document", id="shred-delete-btn", className="mt-2 btn-tertiary", n_clicks=0)
+        ]), className="mb-2", id="shred-doc-preview-card", style={"display": "none"}
     )
+def make_tab(tab_id, label):
+    if tab_id == "shred":
+        # Insert doc preview card for shred
+        return dbc.Card(
+            dbc.CardBody([
+                make_textarea(tab_id, f"Instructions for {label} (optional)"),
+                make_upload(tab_id),
+                make_shred_doc_preview(),
+                dbc.Button(f"Generate {label}", id=f'{tab_id}-btn', className="mt-2 btn-primary", n_clicks=0),
+                dcc.Loading(html.Div(id=f'{tab_id}-output'), id="loading", type="default", parent_style={'justifyContent': 'center'}),
+                dbc.Button(f"Download {label} Report", id=f"{tab_id}-download-btn", className="mt-2 btn-secondary", n_clicks=0),
+                dcc.Download(id=f"{tab_id}-download"),
+                dcc.Store(id="shred-upload-store")
+            ]), className="mb-4"
+        )
+    else:
+        return dbc.Card(
+            dbc.CardBody([
+                make_textarea(tab_id, f"Instructions for {label} (optional)"),
+                make_upload(tab_id),
+                dbc.Button(f"Generate {label}", id=f'{tab_id}-btn', className="mt-2 btn-primary", n_clicks=0),
+                dcc.Loading(html.Div(id=f'{tab_id}-output'), type="default", parent_style={'justifyContent': 'center'}),
+                dbc.Button(f"Download {label} Report", id=f"{tab_id}-download-btn", className="mt-2 btn-secondary", n_clicks=0),
+                dcc.Download(id=f"{tab_id}-download")
+            ]), className="mb-4"
+        )
 # Map each tab id to its card, built once by make_tab for every main_tabs entry.
 tab_cards = {tab["id"]: make_tab(tab["id"], tab["label"]) for tab in main_tabs}
 # One nav link per tab (id "nav-<tab id>"); only the "shred" link starts active.
 nav_items = [
     dbc.NavLink(tab["label"], href="#", id=f"nav-{tab['id']}", active=(tab["id"] == "shred")) for tab in main_tabs
 ]
 def all_tabs_div():
     return html.Div(
         [
             styles.append({"display": "none"})
     return styles
+@app.callback(
+    [
+        Output("shred-upload-store", "data"),
+        Output("shred-upload-preview", "children"),
+        Output("shred-doc-preview-card", "style"),
+    ],
+    [
+        Input("shred-upload", "contents"),
+        Input("shred-delete-btn", "n_clicks")
+    ],
+    [
+        State("shred-upload", "filename"),
+        State("shred-upload-store", "data"),
+    ],
+    prevent_initial_call=True
+)
+def update_shred_upload(contents, delete_clicks, filename, stored_data):
+    triggered = callback_context.triggered
+    logger.info("Shred upload callback triggered.")
+    if not triggered:
+        return dash.no_update, dash.no_update, dash.no_update
+    trig_id = triggered[0]["prop_id"].split(".")[0]
+    if trig_id == "shred-upload":
+        if contents and filename:
+            logger.info(f"Document uploaded in Shred: {filename}")
+            text = process_document(contents, filename)
+            preview = html.Div([
+                html.B(f"Uploaded: {filename}"),
+                html.Br(),
+                html.Div(text[:2000] + ("..." if len(text) > 2000 else ""), style={"whiteSpace": "pre-wrap", "overflowWrap": "break-word", "fontSize": "small"})
+            ])
+            return {"contents": contents, "filename": filename, "preview": text[:2000]}, preview, {"display": "block"}
+        else:
+            return None, "", {"display": "none"}
+    elif trig_id == "shred-delete-btn":
+        logger.info("Shred document deleted by user.")
+        return None, "", {"display": "none"}
+    return dash.no_update, dash.no_update, dash.no_update
 @app.callback(
     [Output(f'{tab_id}-output', 'children') for tab_id in tab_cards] +
     [Output(f"{tab_id}-download", "data") for tab_id in tab_cards],
     [State(f'{tab_id}-upload', 'contents') for tab_id in tab_cards] +
     [State(f'{tab_id}-upload', 'filename') for tab_id in tab_cards] +
     [State(f'{tab_id}-instructions', 'value') for tab_id in tab_cards] +
+    [State(f'{tab_id}-output', 'children') for tab_id in tab_cards] +
+    [State("shred-upload-store", "data")]
 )
 def handle_all_tabs(*args):
     n = len(tab_cards)
     outputs = [None] * (n * 2)
     ctx = callback_context
+    if not ctx.triggered:
+        return outputs
     trig = ctx.triggered[0]['prop_id']
+    logger.info(f"Main callback triggered by {trig}")
     for idx, tab_id in enumerate(tab_cards):
         gen_btn = f"{tab_id}-btn.n_clicks"
         dl_btn = f"{tab_id}-download-btn.n_clicks"
         filename_idx = idx + n
         instr_idx = idx + 2 * n
         prev_output_idx = idx + 3 * n
+        shred_upload_store_idx = 4 * n
         if trig == gen_btn:
+            logger.info(f"Generate button pressed for {tab_id}")
+            if tab_id == "shred":
+                # Use stored doc for Shred
+                shred_data = args[shred_upload_store_idx]
+                instr = args[instr_idx] or ""
+                if shred_data and "contents" in shred_data and "filename" in shred_data:
+                    doc = process_document(shred_data["contents"], shred_data["filename"])
+                    logger.info(f"Shred document will be sent to Anthropic with instructions: {instr}")
+                    content, df = generate_content(doc, "Shred", instr)
+                    if not df.empty:
+                        outputs[out_idx] = dash_table.DataTable(
+                            data=df.to_dict('records'),
+                            columns=[{'name': i, 'id': i} for i in df.columns],
+                            style_table={'overflowX': 'auto'},
+                            style_cell={'textAlign': 'left', 'padding': '5px'},
+                            style_header={'fontWeight': 'bold'}
+                        )
+                    else:
+                        outputs[out_idx] = html.Div([
+                            html.B("Anthropic Response Preview:"),
+                            dcc.Markdown(content)
+                        ])
                 else:
+                    outputs[out_idx] = "Please upload a document to begin."
             else:
+                upload = args[upload_idx]
+                filename = args[filename_idx]
+                instr = args[instr_idx] or ""
+                doc_type = tab_id.replace('-', ' ').title().replace(' ', '')
+                doc_type = next((k for k in document_types if k.lower().replace(' ', '') == tab_id.replace('-', '')), tab_id.title())
+                if upload and filename:
+                    doc = process_document(upload, filename)
+                else:
+                    doc = ""
+                if doc or tab_id == "virtual-board":
+                    content, df = generate_content(doc, doc_type, instr)
+                    if not df.empty:
+                        outputs[out_idx] = dash_table.DataTable(
+                            data=df.to_dict('records'),
+                            columns=[{'name': i, 'id': i} for i in df.columns],
+                            style_table={'overflowX': 'auto'},
+                            style_cell={'textAlign': 'left', 'padding': '5px'},
+                            style_header={'fontWeight': 'bold'}
+                        )
+                    else:
+                        outputs[out_idx] = dcc.Markdown(content)
+                else:
+                    outputs[out_idx] = "Please upload a document to begin."
         elif trig == dl_btn:
             prev_output = args[prev_output_idx]
             if prev_output and hasattr(prev_output, 'props') and 'data' in prev_output.props: