Spaces:

Manasa1
/

VIDEO_SEARCH_SUMMARIZER

Running

App Files Files Community

Manasa1 committed on Jan 12

Commit

abc673c

verified ·

1 Parent(s): 4f990da

Update app.py

Browse files

Files changed (1) hide show

app.py +139 -143

app.py CHANGED Viewed

@@ -1,25 +1,27 @@
 import streamlit as st
 from phi.agent import Agent
 from phi.model.google import Gemini
 from phi.tools.duckduckgo import DuckDuckGo
 from phi.tools.youtube_tools import YouTubeTools
 import google.generativeai as genai
 import time
 from pathlib import Path
 import tempfile
-from dotenv import load_dotenv
 import os
 # Load environment variables
 load_dotenv()
-# Configure Gemini API
 API_KEY = os.getenv("GOOGLE_API_KEY")
-if not API_KEY:
-    st.error("Please set the GOOGLE_API_KEY environment variable")
-    st.stop()
-genai.configure(api_key=API_KEY)
 # Page configuration
 st.set_page_config(
@@ -29,162 +31,156 @@ st.set_page_config(
 )
 st.title("Phidata Video AI Summarizer Agent 🎥🎤🖬")
-st.header("Powered by Gemini 2.0 Flash Exp")
-# Initialize agents
-@st.cache_resource
-def initialize_multimodal_agent():
-    return Agent(
-        name="Video AI Summarizer",
-        model=Gemini(id="gemini-2.0-flash-exp"),
-        tools=[DuckDuckGo(), YouTubeTools()],
-        markdown=True,
-    )
-@st.cache_resource
-def initialize_youtube_agent():
-    return Agent(
-        name="YouTube Summarizer",
-        model=Gemini(id="gemini-2.0-flash-exp"),
-        tools=[YouTubeTools()],
-        get_youtube_video_captions = True,
-        show_tool_calls=True,
-        description="You are a YouTube agent. Obtain the captions of a YouTube video and answer questions.",
-        markdown=True,
-    )
-multimodal_Agent = initialize_multimodal_agent()
-youtube_agent = initialize_youtube_agent()
-def generate_analysis_prompt(query, video_source):
-    return f"""
-    Analyze the {video_source} for content and context.
-    Key areas to address:
-    1. Main topics and themes
-    2. Key points and insights
-    3. Specific answer to user query: {query}
-    4. Supporting context from web research
-    Provide a structured, detailed response with clear sections and actionable insights.
-    """
-# Create tabs for different input methods
-video_tab, youtube_tab = st.tabs(["Upload Video", "YouTube URL"])
-# Upload Video Tab
-with video_tab:
-    upload_query = st.text_area(
-        "What insights are you seeking from the uploaded video?",
-        placeholder="Ask anything about the video content. The AI agent will analyze and gather additional context if needed.",
-        help="Provide specific questions or insights you want from the uploaded video.",
-        key="upload_query"
-    )
     video_file = st.file_uploader(
-        "Upload a video file",
-        type=['mp4', 'mov', 'avi'],
-        help="Upload a video for AI analysis"
     )
     if video_file:
-        st.video(video_file, format="video/mp4", start_time=0)
-        if st.button("🔍 Analyze Uploaded Video", use_container_width=True):
-            if not upload_query:
                 st.warning("Please enter a question or insight to analyze the video.")
             else:
                 try:
                     with st.spinner("Processing video and gathering insights..."):
-                        # Create temporary file
-                        with tempfile.NamedTemporaryFile(delete=False, suffix='.mp4') as temp_video:
-                            temp_video.write(video_file.getvalue())
-                            video_path = temp_video.name
-                        # Upload and process video
-                        processed_video = genai.upload_file(video_path)
-                        # Wait for processing with timeout
-                        timeout = 60  # 60 seconds timeout
-                        start_time = time.time()
                         while processed_video.state.name == "PROCESSING":
-                            if time.time() - start_time > timeout:
-                                raise TimeoutError("Video processing timed out")
                             time.sleep(1)
-                            processed_video = genai.get_file(processed_video.name)
-                        # Generate and run analysis
-                        analysis_prompt = generate_analysis_prompt(upload_query, "uploaded video")
                         response = multimodal_Agent.run(analysis_prompt, videos=[processed_video])
-                        # Display results
-                        st.success("Analysis complete!")
-                        st.subheader("Analysis Results")
-                        st.markdown(response.content)
-                except TimeoutError:
-                    st.error("Video processing timed out. Please try with a shorter video.")
                 except Exception as error:
-                    st.error(f"An error occurred: {str(error)}")
                 finally:
-                    # Clean up temporary file
                     Path(video_path).unlink(missing_ok=True)
     else:
-        st.info("Please upload a video file to begin analysis.")
-# YouTube URL Tab
-with youtube_tab:
-    youtube_query = st.text_area(
-        "What would you like to know about the YouTube video?",
-        placeholder="Ask specific questions about the video or leave empty for a general summary.",
-        help="Enter your question about the YouTube video or leave blank for a general summary.",
-        key="youtube_query"
-    )
-    youtube_url = st.text_input(
-        "Paste a YouTube URL:",
-        placeholder="https://www.youtube.com/watch?v=..."
-    )
-    if youtube_url:
-        if st.button("🔍 Analyze YouTube Video", use_container_width=True):
-            try:
-                with st.spinner("Fetching video content and analyzing..."):
-                    # Generate prompt based on whether there's a user query
-                    youtube_prompt = generate_analysis_prompt(youtube_query, youtube_url)
-                    # Use the YouTube-specific agent to process the video
-                    response = youtube_agent.run(youtube_prompt, markdown=True)
-                    # Display results
-                    st.success("Analysis complete!")
-                    st.subheader("Analysis Results")
-                    st.markdown(response.content)
-            except Exception as error:
-                st.error(f"An error occurred: {str(error)}")
     else:
-        st.info("Please enter a YouTube URL to begin analysis.")
-# Custom styling
-st.markdown(
-    """
-    <style>
-    .stTextArea textarea {
-        height: 100px;
-    }
-    .stButton button {
-        background-color: #FF4B4B;
-        color: white;
-        font-weight: bold;
-    }
-    .stButton button:hover {
-        background-color: #FF3333;
-    }
-    </style>
-    """,
-    unsafe_allow_html=True
-)

 import streamlit as st
 from phi.agent import Agent
 from phi.model.google import Gemini
+from phi.model.groq import Groq
 from phi.tools.duckduckgo import DuckDuckGo
 from phi.tools.youtube_tools import YouTubeTools
+from google.generativeai import upload_file, get_file
 import google.generativeai as genai
+from dotenv import load_dotenv
 import time
 from pathlib import Path
 import tempfile
 import os
 # Load environment variables
 load_dotenv()
+# Google API Key
 API_KEY = os.getenv("GOOGLE_API_KEY")
+if API_KEY:
+    genai.configure(api_key=API_KEY)
+# Groq API Key
+groq_api_key = os.getenv("Groq_Api_key")
 # Page configuration
 st.set_page_config(
 )
 st.title("Phidata Video AI Summarizer Agent 🎥🎤🖬")
+# Tabs for video upload and YouTube summarization
+tab1, tab2 = st.tabs(["🎥 Video Upload", "🌐 YouTube Summarizer"])
+# Tab 1: Video Upload and Analysis
+with tab1:
+    st.header("🎥 Analyze Uploaded Video")
+    st.subheader("Powered by Gemini 2.0 Flash Exp")
+    # Upper bound (seconds) on how long to wait for Gemini to finish ingesting
+    # an uploaded video before giving up.
+    VIDEO_PROCESSING_TIMEOUT_S = 60
+    @st.cache_resource
+    def initialize_multimodal_agent():
+        """Build the Gemini agent used to analyze uploaded videos.
+
+        Wrapped in st.cache_resource so the Agent is created once and shared
+        across Streamlit reruns instead of being rebuilt on every interaction.
+        """
+        return Agent(
+            name="Video AI Summarizer",
+            model=Gemini(id="gemini-2.0-flash-exp"),
+            tools=[DuckDuckGo()],
+            markdown=True,
+        )
+    multimodal_Agent = initialize_multimodal_agent()
+    # File uploader
     video_file = st.file_uploader(
+        "Upload a video file", type=['mp4', 'mov', 'avi'], help="Upload a video for AI analysis"
     )
     if video_file:
+        # Preview straight from the upload buffer: the script reruns on every
+        # widget interaction, so writing a temp file here would leak one file
+        # per rerun that does not end in an analysis.
+        st.video(video_file, format="video/mp4", start_time=0)
+        user_query = st.text_area(
+            "What insights are you seeking from the video?",
+            placeholder="Ask anything about the video content. The AI agent will analyze and gather additional context if needed.",
+            help="Provide specific questions or insights you want from the video."
+        )
+        if st.button("🔍 Analyze Video", key="analyze_video_button"):
+            if not user_query:
                 st.warning("Please enter a question or insight to analyze the video.")
             else:
+                video_path = None
                 try:
                     with st.spinner("Processing video and gathering insights..."):
+                        # Persist the upload to disk only for the duration of the
+                        # analysis, keeping the original extension so the file
+                        # type is not mislabelled for .mov/.avi uploads.
+                        suffix = Path(video_file.name).suffix or '.mp4'
+                        with tempfile.NamedTemporaryFile(delete=False, suffix=suffix) as temp_video:
+                            # Record the path before writing so cleanup still
+                            # happens if the write itself fails.
+                            video_path = temp_video.name
+                            temp_video.write(video_file.getvalue())
+                        # Upload and process video file
+                        processed_video = upload_file(video_path)
+                        # Poll until ingestion finishes, but stop at a deadline so
+                        # a stuck upload cannot hang the app forever.
+                        deadline = time.monotonic() + VIDEO_PROCESSING_TIMEOUT_S
                         while processed_video.state.name == "PROCESSING":
+                            if time.monotonic() > deadline:
+                                raise TimeoutError("Video processing timed out")
                             time.sleep(1)
+                            processed_video = get_file(processed_video.name)
+                        if processed_video.state.name == "FAILED":
+                            raise RuntimeError("Video processing failed")
+                        # Prompt generation for analysis
+                        analysis_prompt = (
+                            f"""
+                            Analyze the uploaded video for content and context.
+                            Respond to the following query using video insights and supplementary web research:
+                            {user_query}
+                            Provide a detailed, user-friendly, and actionable response.
+                            """
+                        )
+                        # AI agent processing
                         response = multimodal_Agent.run(analysis_prompt, videos=[processed_video])
+                    # Display the result
+                    st.subheader("Analysis Result")
+                    st.markdown(response.content)
+                except TimeoutError:
+                    st.error("Video processing timed out. Please try with a shorter video.")
                 except Exception as error:
+                    st.error(f"An error occurred during analysis: {error}")
                 finally:
+                    # Clean up temporary video file (if one was created)
+                    if video_path is not None:
+                        Path(video_path).unlink(missing_ok=True)
     else:
+        st.info("Upload a video file to begin analysis.")
+# Tab 2: YouTube Video Summarizer with Search Results
+with tab2:
+    st.header("🌐 Summarize and Analyze YouTube Videos with Search Results")
+    @st.cache_resource
+    def initialize_youtube_agent():
+        """Build the Groq-backed agent used for YouTube analysis.
+
+        The agent is given YouTubeTools and DuckDuckGo as tools. It is wrapped
+        in st.cache_resource so it is created once and reused across reruns.
+        """
+        return Agent(
+            tools=[YouTubeTools(), DuckDuckGo()],
+            model=Groq(id="llama-3.3-70b-versatile", api_key=groq_api_key),
+            show_tool_calls=True,
+            # Ask for markdown output so the result renders well in st.markdown.
+            markdown=True,
+            description=(
+                # Adjacent literals are concatenated verbatim, so each sentence
+                # must carry its own trailing punctuation and space.
+                "You are a YouTube agent. Obtain the captions of a YouTube video and answer questions. "
+                "You are a YouTube analysis agent. Your task is to summarize videos, "
+                "identify key points, provide insights, and gather relevant search results for additional context."
+            ),
+        )
+    if not groq_api_key:
+        st.error("Groq API key not found. Ensure it is set in the .env file.")
     else:
+        youtube_agent = initialize_youtube_agent()
+        video_url = st.text_input("Enter YouTube video URL:")
+        user_query = st.text_area(
+            "What specific insights or analysis are you looking for?",
+            placeholder="For example: 'Summarize the video content, analyze the speaker's tone, and provide related key takeaways.'",
+            help="Provide specific instructions for a more detailed analysis of the YouTube video."
+        )
+        if st.button("Generate Analysis with Search Results", key="analyze_youtube_search_button"):
+            if not video_url.strip():
+                st.warning("Please enter a valid YouTube video URL.")
+            elif not user_query.strip():
+                st.warning("Please provide specific instructions for analysis.")
+            else:
+                with st.spinner("Processing video and generating insights..."):
+                    try:
+                        # Enhanced Prompt for Tab 2
+                        enhanced_prompt = (
+                            f"""
+                            Analyze the YouTube video available at: {video_url}
+                            Your task:
+                            - Watch and analyze the video content.
+                            - Summarize the main ideas, arguments, or points presented in the video.
+                            - Identify key takeaways, such as statistics, quotes, or important insights.
+                            - Analyze the speaker's tone, purpose, and the intended audience for the video.
+                            - Highlight any actionable insights, lessons, or suggestions the video provides.
+                            In addition to summarizing the video, perform a web search to gather supplementary information about the video's topic.
+                            For example:
+                            - Provide links to relevant blogs, articles, or news stories.
+                            - Highlight related insights or key trends from your search.
+                            - Suggest further reading materials for users who wish to dive deeper into the topic.
+                            Final Output:
+                            - Present the analysis in a concise, user-friendly format.
+                            - Structure the output clearly with headings for each section, such as 'Summary', 'Key Insights', 'Search Results', etc.
+                            - If any supplementary information conflicts with the video content, mention it explicitly.
+                            User Query/Focus:
+                            {user_query}
+                            """
+                        )
+                        # print_response() writes to the terminal and returns None,
+                        # so call run() and render the returned content instead.
+                        response = youtube_agent.run(enhanced_prompt)
+                        # Display the results
+                        st.subheader("Video Analysis and Summary")
+                        st.markdown(response.content)
+                    except Exception as e:
+                        st.error(f"An error occurred: {e}")