Spaces:

irfansaleem48
/

AI_Meeting_Assistant

Sleeping

App Files Community

irfansaleem48 committed on Feb 23

Commit

5a00d25

verified ·

1 Parent(s): d48624f

Update app.py

Browse files

Files changed (1) hide show

app.py +15 -7

app.py CHANGED Viewed

@@ -8,7 +8,7 @@ import os
 @st.cache_resource
 def load_models():
-    whisper_model = whisper.load_model("base")
     summarizer = pipeline("summarization", model="facebook/bart-large-cnn")
     nlp = spacy.load("en_core_web_sm")
     return whisper_model, summarizer, nlp
@@ -41,19 +41,28 @@ def main():
     whisper_model, summarizer, nlp = load_models()
-    audio_file = st.file_uploader("Upload meeting audio", type=["wav", "mp3", "m4a"])
     if audio_file is not None:
-        file_path = f"uploaded_audio_{datetime.datetime.now().timestamp()}"
         with open(file_path, "wb") as f:
             f.write(audio_file.getbuffer())
         st.subheader("Meeting Transcription")
         with st.spinner("Transcribing audio..."):
             result = whisper_model.transcribe(file_path)
             transcript = result["text"]
         st.write(transcript)
-        os.remove(file_path)
         st.subheader("Meeting Summary")
         with st.spinner("Generating summary..."):
@@ -78,10 +87,9 @@ def main():
                 """)
         st.subheader("🔑 Key Terms")
-        # Fixed keyword processing
         key_phrases_result = keywords.keywords(transcript) or ""
         key_phrases = [kp.strip() for kp in key_phrases_result.split("\n") if kp.strip()]
         st.write(", ".join(key_phrases) if key_phrases else "No key terms extracted")
 if __name__ == "__main__":
-    main()

 @st.cache_resource
 def load_models():
+    whisper_model = whisper.load_model("base")  # You can use 'small' or 'medium' for better results
     summarizer = pipeline("summarization", model="facebook/bart-large-cnn")
     nlp = spacy.load("en_core_web_sm")
     return whisper_model, summarizer, nlp
     whisper_model, summarizer, nlp = load_models()
+    audio_file = st.file_uploader("Upload meeting audio", type=["wav", "mp3", "m4a", "ogg", "flac"])
     if audio_file is not None:
+        file_path = f"uploaded_audio_{datetime.datetime.now().timestamp()}.wav"
+        # Save uploaded file
         with open(file_path, "wb") as f:
             f.write(audio_file.getbuffer())
         st.subheader("Meeting Transcription")
         with st.spinner("Transcribing audio..."):
+            # Load and process audio
+            audio = whisper.load_audio(file_path)  # Converts to 16kHz mono
+            audio = whisper.pad_or_trim(audio)  # Ensures proper input size
+            mel = whisper.log_mel_spectrogram(audio).to(whisper_model.device)
+            # Transcribe
             result = whisper_model.transcribe(file_path)
             transcript = result["text"]
         st.write(transcript)
+        os.remove(file_path)  # Cleanup
         st.subheader("Meeting Summary")
         with st.spinner("Generating summary..."):
                 """)
         st.subheader("🔑 Key Terms")
         key_phrases_result = keywords.keywords(transcript) or ""
         key_phrases = [kp.strip() for kp in key_phrases_result.split("\n") if kp.strip()]
         st.write(", ".join(key_phrases) if key_phrases else "No key terms extracted")
 if __name__ == "__main__":
+    main()