Spaces:

shukdevdatta123
/

Systematic-Research-Paper-Review

Sleeping

App Files Files Community

shukdevdatta123 committed on May 11

Commit

6fe23ea

verified ·

1 Parent(s): f8308a2

Update app.py

Browse files

Files changed (1) hide show

app.py +237 -11

app.py CHANGED Viewed

@@ -24,8 +24,119 @@ def extract_text_from_pdf(pdf_path):
     except Exception as e:
         return f"Error extracting text from PDF: {str(e)}"
 # Function to interact with OpenAI API for systematic review
-def generate_systematic_review(pdf_files, review_question, include_tables=True):
     if not api_key:
         return "Please enter your OpenAI API key first."
@@ -78,6 +189,8 @@ def generate_systematic_review(pdf_files, review_question, include_tables=True):
         Include a comprehensive reference list following a specific citation style (APA, Vancouver, etc.). Provide links to source papers when available.
         Your response should be formatted in HTML (but avoid showing these tags ```html ```) but generate the content to look like a professional academic paper. Include proper section headers, abstracts, methodology sections, etc. Number all sections like an academic paper. Follow academic journal standards with double spacing, appropriate margins, and consistent formatting throughout.
         """
         # Extract text from each PDF
@@ -100,8 +213,22 @@ def generate_systematic_review(pdf_files, review_question, include_tables=True):
         table_instruction = ""
         if include_tables:
             table_instruction = " Please include important new generated tables in your review."
-        user_prompt = f"Please generate a systematic review of the following {len(pdf_files)} papers: {', '.join(pdf_names)}.{table_instruction}\n\nReview Question: {review_question}"
         # Create the messages for the API call
         messages = [
@@ -121,6 +248,41 @@ def generate_systematic_review(pdf_files, review_question, include_tables=True):
         # Get the AI response
         review_content = response["choices"][0]["message"]["content"]
         # Apply professional academic paper styling
         styled_html = f"""
         <!DOCTYPE html>
@@ -244,6 +406,13 @@ def generate_systematic_review(pdf_files, review_question, include_tables=True):
                     font-size: 12px;
                     color: #777;
                 }}
                 @media print {{
                     body {{
                         background-color: white;
@@ -422,18 +591,36 @@ custom_css = """
         border-radius: 8px;
     }
     /* Responsive adjustments */
     @media screen and (max-width: 768px) {
         .gradio-container {
             padding: 10px;
         }
     }
 </style>
 """
 # Gradio UI Layout with improved styling
 with gr.Blocks(css=custom_css) as demo:
-    gr.Markdown("# Systematic Review Generator for Research Papers")
     with gr.Accordion("How to Use This App", open=False):
         gr.Markdown("""
@@ -441,9 +628,15 @@ with gr.Blocks(css=custom_css) as demo:
         1. Enter your OpenAI API key in the field below and click "Set API Key"
         2. Upload multiple PDF research papers (2 or more recommended)
         3. Enter your review question or topic
-        4. Check the "Include Tables" option if you want the review to include comparison tables
-        5. Click "Generate Systematic Review" to start the process
-        6. After generation, you can download the review as HTML
         ### Tips for Best Results:
         - Upload papers that are related to the same research topic or field
@@ -472,6 +665,22 @@ with gr.Blocks(css=custom_css) as demo:
                 placeholder="e.g., What are the effects of mindfulness meditation on stress reduction?"
             )
             include_tables = gr.Checkbox(label="Include Comparison Tables", value=True)
             generate_button = gr.Button("Generate Systematic Review", elem_id="generate_button", size="large")
     # Download link container
@@ -485,7 +694,10 @@ with gr.Blocks(css=custom_css) as demo:
     api_key_button.click(set_api_key, inputs=[api_key_input], outputs=[api_key_output])
     # Generate systematic review
-    def process_files_and_generate_review(files, question, include_tables):
         if not files:
             return ("""
             <div style="padding: 20px; border: 1px solid #e0e0e0; border-radius: 5px; background-color: #f9f9f9;">
@@ -500,7 +712,7 @@ with gr.Blocks(css=custom_css) as demo:
         # Show loading message
         loading_message = """
         <div style="padding: 20px; text-align: center;">
-            <h3>Generating Systematic Review...</h3>
             <p>This may take a few minutes depending on the number and size of papers.</p>
             <div style="width: 100%; height: 4px; background-color: #f0f0f0; margin: 20px 0; border-radius: 2px; overflow: hidden;">
                 <div style="width: 30%; height: 100%; background: linear-gradient(90deg, #4a00e0, #8e2de2); animation: progress 2s infinite linear;"></div>
@@ -516,8 +728,19 @@ with gr.Blocks(css=custom_css) as demo:
         yield loading_message, ""
-        # Generate review
-        review = generate_systematic_review(saved_paths, question, include_tables)
         # Create HTML download link
         html_link = create_html_download_link(review)
@@ -543,7 +766,10 @@ with gr.Blocks(css=custom_css) as demo:
     generate_button.click(
         process_files_and_generate_review,
-        inputs=[pdf_files, review_question, include_tables],
         outputs=[review_output, download_html_output]
     )

     except Exception as e:
         return f"Error extracting text from PDF: {str(e)}"
+# Function to generate PRISMA flow chart SVG
+def generate_prisma_flow_chart(records_db, records_other, duplicates, excluded_screening, excluded_fulltext, included_studies,
+                              included_meta=None, fulltext_assessed=None):
+    """Return the markup of a PRISMA flow diagram as an inline SVG string.
+
+    Args:
+        records_db: Number of records identified through database searching.
+        records_other: Number of records identified through other sources.
+        duplicates: Number of duplicate records; subtracted from the sum of
+            the two counts above to get the "after duplicates removed" and
+            "records screened" figures.
+        excluded_screening: Number of records excluded at title/abstract
+            screening.
+        excluded_fulltext: Number of full-text articles excluded.
+        included_studies: Number of studies in the qualitative synthesis.
+        included_meta: Number of studies in the quantitative synthesis. When
+            None, the meta-analysis box and its arrow are left out.
+        fulltext_assessed: Number of full-text articles assessed. When None,
+            it is computed as excluded_fulltext + included_studies.
+
+    Returns:
+        The SVG document fragment as a string.
+    """
+    # Calculate values if not provided
+    if fulltext_assessed is None:
+        fulltext_assessed = excluded_fulltext + included_studies
+    records_after_duplicates = records_db + records_other - duplicates
+    # Build the optional meta-analysis fragment up front. Nesting a
+    # triple-single-quoted f-string inside another one is only valid syntax
+    # from Python 3.12 (PEP 701); older interpreters end the outer literal at
+    # the inner quotes and fail with a SyntaxError.
+    if included_meta is not None:
+        meta_section = f'''
+        <line x1="400" y1="490" x2="400" y2="530" class="arrow" />
+        <rect x="250" y="530" width="300" height="60" class="box" />
+        <text x="400" y="550" class="box-title">Meta-Analysis</text>
+        <text x="400" y="575">Studies included in quantitative synthesis</text>
+        <text x="400" y="590">(n = {included_meta})</text>
+        '''
+    else:
+        meta_section = ''
+    # Create SVG content for PRISMA flow chart
+    svg_content = f'''
+    <svg xmlns="http://www.w3.org/2000/svg" viewBox="0 0 800 800" width="700" height="700">
+        <style>
+            .box {{
+                fill: #f9f9f9;
+                stroke: #333;
+                stroke-width: 2;
+            }}
+            .arrow {{
+                stroke: #333;
+                stroke-width: 2;
+                marker-end: url(#arrowhead);
+            }}
+            text {{
+                font-family: Arial, sans-serif;
+                font-size: 14px;
+                text-anchor: middle;
+            }}
+            .box-title {{
+                font-weight: bold;
+            }}
+        </style>
+        <defs>
+            <marker id="arrowhead" markerWidth="10" markerHeight="7" refX="9" refY="3.5" orient="auto">
+                <polygon points="0 0, 10 3.5, 0 7" />
+            </marker>
+        </defs>
+        <!-- Identification Section -->
+        <rect x="250" y="30" width="300" height="60" class="box" />
+        <text x="400" y="50" class="box-title">Identification</text>
+        <text x="400" y="75">Records identified through database searching</text>
+        <text x="400" y="90">(n = {records_db})</text>
+        <rect x="600" y="30" width="150" height="60" class="box" />
+        <text x="675" y="50" class="box-title">Additional</text>
+        <text x="675" y="75">Other sources</text>
+        <text x="675" y="90">(n = {records_other})</text>
+        <!-- Arrows -->
+        <line x1="400" y1="90" x2="400" y2="130" class="arrow" />
+        <line x1="675" y1="90" x2="675" y2="110" class="arrow" />
+        <line x1="675" y1="110" x2="400" y2="110" class="arrow" />
+        <!-- Screening Section -->
+        <rect x="250" y="130" width="300" height="60" class="box" />
+        <text x="400" y="150" class="box-title">Screening</text>
+        <text x="400" y="175">Records after duplicates removed</text>
+        <text x="400" y="190">(n = {records_after_duplicates})</text>
+        <line x1="400" y1="190" x2="400" y2="230" class="arrow" />
+        <rect x="250" y="230" width="300" height="60" class="box" />
+        <text x="400" y="250" class="box-title">Title/Abstract Screening</text>
+        <text x="400" y="275">Records screened</text>
+        <text x="400" y="290">(n = {records_after_duplicates})</text>
+        <rect x="600" y="230" width="150" height="60" class="box" />
+        <text x="675" y="255">Records excluded</text>
+        <text x="675" y="275">(n = {excluded_screening})</text>
+        <line x1="400" y1="290" x2="400" y2="330" class="arrow" />
+        <line x1="550" y1="260" x2="600" y2="260" class="arrow" />
+        <!-- Eligibility Section -->
+        <rect x="250" y="330" width="300" height="60" class="box" />
+        <text x="400" y="350" class="box-title">Eligibility</text>
+        <text x="400" y="375">Full-text articles assessed for eligibility</text>
+        <text x="400" y="390">(n = {fulltext_assessed})</text>
+        <rect x="600" y="330" width="150" height="60" class="box" />
+        <text x="675" y="350">Full-text articles</text>
+        <text x="675" y="370">excluded, with reasons</text>
+        <text x="675" y="390">(n = {excluded_fulltext})</text>
+        <line x1="400" y1="390" x2="400" y2="430" class="arrow" />
+        <line x1="550" y1="360" x2="600" y2="360" class="arrow" />
+        <!-- Included Section -->
+        <rect x="250" y="430" width="300" height="60" class="box" />
+        <text x="400" y="450" class="box-title">Included</text>
+        <text x="400" y="475">Studies included in qualitative synthesis</text>
+        <text x="400" y="490">(n = {included_studies})</text>
+        <!-- Optional Meta-Analysis Box -->
+        {meta_section}
+        <!-- PRISMA Title -->
+        <text x="150" y="25" style="font-size: 18px; font-weight: bold; text-anchor: start;">PRISMA Flow Diagram</text>
+    </svg>
+    '''
+    return svg_content
 # Function to interact with OpenAI API for systematic review
+def generate_systematic_review(pdf_files, review_question, prisma_numbers, include_tables=True):
     if not api_key:
         return "Please enter your OpenAI API key first."
         Include a comprehensive reference list following a specific citation style (APA, Vancouver, etc.). Provide links to source papers when available.
         Your response should be formatted in HTML (but avoid showing these tags ```html ```) but generate the content to look like a professional academic paper. Include proper section headers, abstracts, methodology sections, etc. Number all sections like an academic paper. Follow academic journal standards with double spacing, appropriate margins, and consistent formatting throughout.
+        Make sure to include that you conducted a PRISMA flow diagram as part of the methodology section. Reference the PRISMA diagram in your methodology section and explain the numbers used in the diagram.
         """
         # Extract text from each PDF
         table_instruction = ""
         if include_tables:
             table_instruction = " Please include important new generated tables in your review."
+        # Add PRISMA flow information
+        prisma_info = f"""
+        Additionally, I have conducted a PRISMA flow diagram with the following data:
+        - Records identified through database searching: {prisma_numbers['records_db']}
+        - Additional records identified through other sources: {prisma_numbers['records_other']}
+        - Records after duplicates removed: {int(prisma_numbers['records_db']) + int(prisma_numbers['records_other']) - int(prisma_numbers['duplicates'])}
+        - Records excluded during title/abstract screening: {prisma_numbers['excluded_screening']}
+        - Full-text articles excluded with reasons: {prisma_numbers['excluded_fulltext']}
+        - Studies included in qualitative synthesis: {prisma_numbers['included_studies']}
+        """
+        if prisma_numbers.get('included_meta') and prisma_numbers['included_meta'].strip():
+            prisma_info += f"- Studies included in quantitative synthesis (meta-analysis): {prisma_numbers['included_meta']}\n"
+        user_prompt = f"Please generate a systematic review of the following {len(pdf_files)} papers: {', '.join(pdf_names)}.{table_instruction}\n\nReview Question: {review_question}\n\n{prisma_info}"
         # Create the messages for the API call
         messages = [
         # Get the AI response
         review_content = response["choices"][0]["message"]["content"]
+        # Generate PRISMA flow chart SVG
+        prisma_svg = generate_prisma_flow_chart(
+            int(prisma_numbers['records_db']),
+            int(prisma_numbers['records_other']),
+            int(prisma_numbers['duplicates']),
+            int(prisma_numbers['excluded_screening']),
+            int(prisma_numbers['excluded_fulltext']),
+            int(prisma_numbers['included_studies']),
+            int(prisma_numbers['included_meta']) if prisma_numbers.get('included_meta') and prisma_numbers['included_meta'].strip() else None
+        )
+        # Find a suitable place to insert the PRISMA flow chart
+        # Look for the methodology section or PRISMA mentions
+        prisma_html = f'''
+        <div class="prisma-flow-chart">
+            <h3>Figure 1: PRISMA Flow Diagram</h3>
+            {prisma_svg}
+        </div>
+        '''
+        # Try to insert PRISMA diagram after methodology section or before results
+        if "<h2>3. Methodology" in review_content:
+            parts = review_content.split("<h2>3. Methodology", 1)
+            if len(parts) > 1:
+                # Find the next h2 section after methodology
+                next_section = parts[1].find("<h2>")
+                if next_section > -1:
+                    review_content = parts[0] + "<h2>3. Methodology" + parts[1][:next_section] + prisma_html + parts[1][next_section:]
+                else:
+                    review_content = parts[0] + "<h2>3. Methodology" + parts[1] + prisma_html
+        else:
+            # If methodology section not found, insert before results or at the end
+            insert_pos = review_content.find("<h2>4.") if "<h2>4." in review_content else len(review_content) - 100
+            review_content = review_content[:insert_pos] + prisma_html + review_content[insert_pos:]
         # Apply professional academic paper styling
         styled_html = f"""
         <!DOCTYPE html>
                     font-size: 12px;
                     color: #777;
                 }}
+                .prisma-flow-chart {{
+                    margin: 30px 0;
+                    text-align: center;
+                }}
+                .prisma-flow-chart h3 {{
+                    margin-bottom: 15px;
+                }}
                 @media print {{
                     body {{
                         background-color: white;
         border-radius: 8px;
     }
+    /* PRISMA Flow Chart Container */
+    .prisma-section {
+        background-color: white;
+        padding: 20px;
+        border-radius: 8px;
+        box-shadow: 0 2px 10px rgba(0,0,0,0.05);
+        margin-bottom: 20px;
+    }
+    .prisma-form {
+        display: grid;
+        grid-template-columns: 1fr 1fr;
+        gap: 15px;
+    }
     /* Responsive adjustments */
     @media screen and (max-width: 768px) {
         .gradio-container {
             padding: 10px;
         }
+        .prisma-form {
+            grid-template-columns: 1fr;
+        }
     }
 </style>
 """
 # Gradio UI Layout with improved styling
 with gr.Blocks(css=custom_css) as demo:
+    gr.Markdown("# Systematic Review Generator with PRISMA Flow Chart")
     with gr.Accordion("How to Use This App", open=False):
         gr.Markdown("""
         1. Enter your OpenAI API key in the field below and click "Set API Key"
         2. Upload multiple PDF research papers (2 or more recommended)
         3. Enter your review question or topic
+        4. Fill in the PRISMA flow chart information (numbers at each stage of your review)
+        5. Check the "Include Tables" option if you want the review to include comparison tables
+        6. Click "Generate Systematic Review" to start the process
+        7. After generation, you can download the review as HTML
+        ### PRISMA Flow Chart:
+        - The PRISMA (Preferred Reporting Items for Systematic Reviews and Meta-Analyses) flow diagram shows the flow of information through the different phases of your systematic review
+        - Fill in the numbers for each stage to generate an accurate diagram
+        - The diagram will be embedded in your systematic review
         ### Tips for Best Results:
         - Upload papers that are related to the same research topic or field
                 placeholder="e.g., What are the effects of mindfulness meditation on stress reduction?"
             )
             include_tables = gr.Checkbox(label="Include Comparison Tables", value=True)
+    # PRISMA Flow Chart inputs
+    with gr.Row(elem_classes="prisma-section"):
+        with gr.Column():
+            gr.Markdown("### PRISMA Flow Chart Information")
+            gr.Markdown("Enter the numbers for each stage of your systematic review process:")
+            with gr.Row(elem_classes="prisma-form"):
+                prisma_records_db = gr.Textbox(label="Records from database searching", value="100", placeholder="e.g., 100")
+                prisma_records_other = gr.Textbox(label="Records from other sources", value="20", placeholder="e.g., 20")
+                prisma_duplicates = gr.Textbox(label="Duplicates removed", value="15", placeholder="e.g., 15")
+                prisma_excluded_screening = gr.Textbox(label="Records excluded at screening", value="60", placeholder="e.g., 60")
+                prisma_excluded_fulltext = gr.Textbox(label="Full-text articles excluded", value="30", placeholder="e.g., 30")
+                prisma_included_studies = gr.Textbox(label="Studies included in synthesis", value="15", placeholder="e.g., 15")
+                prisma_included_meta = gr.Textbox(label="Studies in meta-analysis (optional)", value="10", placeholder="e.g., 10")
             generate_button = gr.Button("Generate Systematic Review", elem_id="generate_button", size="large")
     # Download link container
     api_key_button.click(set_api_key, inputs=[api_key_input], outputs=[api_key_output])
     # Generate systematic review
+    def process_files_and_generate_review(files, question, include_tables,
+                                           records_db, records_other, duplicates,
+                                           excluded_screening, excluded_fulltext,
+                                           included_studies, included_meta):
         if not files:
             return ("""
             <div style="padding: 20px; border: 1px solid #e0e0e0; border-radius: 5px; background-color: #f9f9f9;">
         # Show loading message
         loading_message = """
         <div style="padding: 20px; text-align: center;">
+            <h3>Generating Systematic Review with PRISMA Flow Chart...</h3>
             <p>This may take a few minutes depending on the number and size of papers.</p>
             <div style="width: 100%; height: 4px; background-color: #f0f0f0; margin: 20px 0; border-radius: 2px; overflow: hidden;">
                 <div style="width: 30%; height: 100%; background: linear-gradient(90deg, #4a00e0, #8e2de2); animation: progress 2s infinite linear;"></div>
         yield loading_message, ""
+        # Collect PRISMA flow chart data
+        prisma_numbers = {
+            'records_db': records_db,
+            'records_other': records_other,
+            'duplicates': duplicates,
+            'excluded_screening': excluded_screening,
+            'excluded_fulltext': excluded_fulltext,
+            'included_studies': included_studies,
+            'included_meta': included_meta
+        }
+        # Generate review with PRISMA flow chart
+        review = generate_systematic_review(saved_paths, question, prisma_numbers, include_tables)
         # Create HTML download link
         html_link = create_html_download_link(review)
     generate_button.click(
         process_files_and_generate_review,
+        inputs=[pdf_files, review_question, include_tables,
+                prisma_records_db, prisma_records_other, prisma_duplicates,
+                prisma_excluded_screening, prisma_excluded_fulltext,
+                prisma_included_studies, prisma_included_meta],
         outputs=[review_output, download_html_output]
     )