File size: 7,146 Bytes
644d52a
db865fa
 
 
 
8a2791f
a7c706c
 
 
 
db865fa
abc0e8f
a7c706c
644d52a
8a2791f
a7c706c
db865fa
644d52a
abc0e8f
db865fa
 
 
644d52a
abc0e8f
db865fa
 
 
 
 
21c5c47
a7c706c
8a2791f
21c5c47
 
8a2791f
21c5c47
8a2791f
21c5c47
 
a7c706c
8a2791f
 
 
 
 
a7c706c
21c5c47
01296a1
 
 
 
92ed364
 
01296a1
92ed364
01296a1
 
 
8a2791f
21c5c47
 
01296a1
21c5c47
 
 
8a2791f
 
 
 
92ed364
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
8a2791f
 
 
 
 
 
 
92ed364
 
 
 
 
 
 
 
 
 
 
8a2791f
 
21c5c47
 
 
a7c706c
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
21c5c47
8a2791f
21c5c47
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170

"""Atma.ai – Streamlit app: transcribe a therapy-session audio file, simulate
speaker diarization, summarize with prior-session context, tag emotions,
plot mock emotion trends, and export everything to a Word document."""

import os
import re
from datetime import datetime

import matplotlib.pyplot as plt
import streamlit as st
from docx import Document
from docx.enum.text import WD_PARAGRAPH_ALIGNMENT
from docx.shared import Pt
from pydub import AudioSegment
from transformers import pipeline

# Page config
st.set_page_config(page_title="Atma.ai - Session Summarizer + Export", layout="wide")

st.title("🧠 Atma.ai – Advanced Mental Health Session Summarizer")
st.markdown("Upload a therapy session audio (Tamil-English mix) to view the transcript, summary, emotional analysis, and export everything to Word!")

# Upload audio
uploaded_file = st.file_uploader("🎙️ Upload audio file", type=["wav", "mp3", "m4a"])

if uploaded_file:
    st.audio(uploaded_file)

    # Convert to mono 16 kHz WAV — the input format Whisper expects.
    audio_path = "temp_audio.wav"
    audio = AudioSegment.from_file(uploaded_file)
    audio = audio.set_channels(1).set_frame_rate(16000)
    audio.export(audio_path, format="wav")

    try:
        # Transcribe with Whisper.
        st.info("🔄 Transcribing with Whisper (mixed-language support)...")
        asr = pipeline("automatic-speech-recognition", model="openai/whisper-large")
        result = asr(audio_path, return_timestamps=True, generate_kwargs={"language": "<|en|>"})
        raw_transcript = result.get("text", "")

        if not raw_transcript:
            st.error("❌ Could not generate a transcript. Please try a different audio.")
        else:
            # Simulated speaker diarization: alternate "Speaker 1"/"Speaker 2"
            # sentence by sentence (no real diarization model is used).
            st.info("🗣️ Simulating speaker separation...")
            sentences = re.split(r'(?<=[.?!])\s+', raw_transcript)
            diarized_transcript = ""
            for idx, sentence in enumerate(sentences):
                speaker = "Speaker 1" if idx % 2 == 0 else "Speaker 2"
                diarized_transcript += f"{speaker}: {sentence}\n\n"

            # Static session-context recall (mock data standing in for a
            # retrieval step over past session notes).
            st.info("🔍 Loading previous session context...")
            past_sessions = [
                {"date": "2024-04-15", "coping": "walking", "emotion": "anxiety", "notes": "high workload"},
                {"date": "2024-04-22", "coping": "journaling", "emotion": "stress", "notes": "difficulty sleeping"}
            ]
            rag_context = "\n".join([f"Session {i+1}: {s['coping']}, {s['emotion']}, {s['notes']}" for i, s in enumerate(past_sessions)])

            prompt_input = f"""Previous session context:\n{rag_context}\n\nCurrent session:\n{raw_transcript}"""

            # Summarization. truncation=True keeps long transcripts from
            # exceeding the model's max input length and raising an error.
            st.info("📋 Summarizing conversation...")
            summarizer = pipeline("summarization", model="philschmid/bart-large-cnn-samsum")
            summary = summarizer(prompt_input, max_length=256, min_length=60, do_sample=False, truncation=True)

            # Emotion tagging over the full (un-diarized) transcript.
            st.info("🎭 Extracting emotional tones...")
            emotion_model = pipeline("text-classification", model="j-hartmann/emotion-english-distilroberta-base", return_all_scores=True)
            emotion_scores = emotion_model(raw_transcript)

            # Layout with tabs.
            tab1, tab2, tab3, tab4 = st.tabs(["📝 Transcript", "📋 Summary", "💬 Emotions", "📈 Trends"])

            with tab1:
                st.subheader("📝 Speaker-Simulated Transcript")
                st.markdown(diarized_transcript, unsafe_allow_html=True)

            with tab2:
                st.subheader("📋 Contextual Summary")
                # Insight tracking: simple keyword checks against the mock
                # previous-session data above.
                insights = []
                if "music" in raw_transcript.lower():
                    if any("walking" in s["coping"] for s in past_sessions):
                        insights.append("Patient previously mentioned walking as a helpful coping mechanism. This time, music is highlighted instead.")
                if "sleep" in raw_transcript.lower():
                    insights.append("Sleep continues to be a recurring theme across sessions.")
                final_output = f"{summary[0]['summary_text']}\n\nContextual Observations:\n" + "\n".join(insights)
                st.write(final_output)

            with tab3:
                st.subheader("💬 Emotional Insights (Overall)")
                for emo in emotion_scores[0]:
                    st.write(f"{emo['label']}: {round(emo['score']*100, 2)}%")

            with tab4:
                st.subheader("📈 Emotional Trends Over Time")
                # Static mock trend data; replace with stored per-session
                # scores once persistence exists.
                session_dates = ["2024-04-01", "2024-04-08", "2024-04-15", "2024-04-22"]
                anxiety_scores = [70, 65, 55, 40]
                sadness_scores = [30, 20, 25, 15]

                fig, ax = plt.subplots()
                ax.plot(session_dates, anxiety_scores, label='Anxiety', marker='o')
                ax.plot(session_dates, sadness_scores, label='Sadness', marker='o')
                ax.set_title("Emotional Trends Over Time")
                ax.set_ylabel("Score (%)")
                ax.set_xlabel("Session Date")
                ax.legend()
                st.pyplot(fig)

            # Export Button
            st.subheader("📥 Export Session Report")

            def generate_docx(transcript, summary_text, emotions):
                """Build the session report as a .docx file on disk.

                Args:
                    transcript: speaker-labelled transcript text.
                    summary_text: summary paragraph for the session.
                    emotions: pipeline output; emotions[0] is a list of
                        {"label", "score"} dicts for the whole transcript.

                Returns:
                    Path of the saved document ("session_summary.docx").
                """
                doc = Document()

                # Title
                title = doc.add_heading('Session Summary - Atma.ai', 0)
                title.alignment = WD_PARAGRAPH_ALIGNMENT.CENTER

                # Date
                date_paragraph = doc.add_paragraph(f"Date: {datetime.now().strftime('%Y-%m-%d')}")
                date_paragraph.runs[0].italic = True

                doc.add_paragraph("\n")

                # Transcript
                doc.add_heading('📝 Transcript', level=1)
                transcript_para = doc.add_paragraph(transcript)
                transcript_para.runs[0].font.size = Pt(12)

                doc.add_paragraph("\n")

                # Summary
                doc.add_heading('📋 Summary', level=1)
                summary_para = doc.add_paragraph(summary_text)
                summary_para.runs[0].font.size = Pt(12)

                doc.add_paragraph("\n")

                # Emotional Insights
                doc.add_heading('💬 Emotional Insights', level=1)
                for emo in emotions[0]:
                    emotion_para = doc.add_paragraph(f"{emo['label']}: {round(emo['score']*100, 2)}%")
                    emotion_para.runs[0].font.size = Pt(12)

                # Footer
                doc.add_paragraph("\n\n---\nGenerated by Atma.ai – Confidential", style="Intense Quote")

                output_path = "session_summary.docx"
                doc.save(output_path)
                return output_path

            # NOTE(review): nesting download_button inside a button callback
            # means the download link vanishes on the next rerun — acceptable
            # for a demo, but consider generating the file unconditionally.
            if st.button("Generate and Download Report (.docx)"):
                output_file = generate_docx(diarized_transcript, summary[0]["summary_text"], emotion_scores)
                with open(output_file, "rb") as f:
                    st.download_button(label="📥 Download Report", data=f, file_name="session_summary.docx", mime="application/vnd.openxmlformats-officedocument.wordprocessingml.document")

    except Exception as err:
        st.error(f"❌ Processing failed: {err}")
    finally:
        # Always clean up the temporary WAV, even on failure.
        if os.path.exists(audio_path):
            os.remove(audio_path)