Spaces:

developer28
/

Youtubedownloader

Sleeping

App Files Community

developer28 committed 9 days ago

Commit

168cef5

verified ·

1 Parent(s): 3e5d7ea

Update app.py

Browse files

Files changed (1) hide show

app.py +31 -30

app.py CHANGED Viewed

@@ -13,7 +13,7 @@ try:
 except:
     WHISPER_AVAILABLE = False
-# ✅ Download audio from YouTube
 def download_audio(url, cookies_path=None):
     try:
         temp_dir = tempfile.mkdtemp()
@@ -25,15 +25,9 @@ def download_audio(url, cookies_path=None):
             'quiet': True,
             'noplaylist': True,
             'cookiefile': cookies_path if cookies_path else None,
-            'user_agent': 'Mozilla/5.0 (Windows NT 10.0; Win64; x64)',
             'referer': 'https://www.youtube.com/',
             'force_ipv4': True,
-            'http_headers': {
-                'User-Agent': 'Mozilla/5.0 (Windows NT 10.0; Win64; x64)',
-                'Accept': 'text/html,application/xhtml+xml,application/xml;q=0.9,*/*;q=0.8',
-                'Accept-Language': 'en-US,en;q=0.5',
-                'Referer': 'https://www.youtube.com/'
-            },
         }
         with YoutubeDL(ydl_opts) as ydl:
@@ -50,7 +44,7 @@ def download_audio(url, cookies_path=None):
         traceback.print_exc()
         return None, f"❌ Download error: {str(e)}"
-# ✅ Transcribe audio using Whisper
 def transcribe_audio(path):
     if not WHISPER_AVAILABLE:
         return "❌ Whisper not available. Please install openai-whisper."
@@ -62,13 +56,13 @@ def transcribe_audio(path):
         traceback.print_exc()
         return f"❌ Transcription failed: {str(e)}"
-# ✅ Extract stock-related information
 def extract_stock_info(text):
     try:
         companies = re.findall(r'\b[A-Z][a-z]+(?: [A-Z][a-z]+)*\b', text)
         symbols = re.findall(r'\b[A-Z]{2,5}\b', text)
         prices = re.findall(r'\$\d+(?:\.\d{1,2})?', text)
-        actions = re.findall(r'\b(buy|sell|hold|target|bullish|bearish|stop loss)\b', text, re.IGNORECASE)
         result = "=== STOCK RECOMMENDATION ANALYSIS ===\n\n"
         if companies:
@@ -82,7 +76,7 @@ def extract_stock_info(text):
         recommendations = []
         for line in text.split("."):
-            if any(word in line.lower() for word in ['buy', 'sell', 'target', 'hold']):
                 recommendations.append(line.strip())
         if recommendations:
@@ -98,7 +92,7 @@ def extract_stock_info(text):
     except Exception as e:
         return f"❌ Stock info extraction failed: {str(e)}"
-# ✅ Save uploaded cookies.txt
 def save_cookies(file):
     if file is None:
         return None
@@ -115,11 +109,11 @@ def save_cookies(file):
         print(f"❌ Failed to handle cookies.txt: {e}")
         return None
-# ✅ YouTube pipeline
-def run_pipeline(url, cookies_file):
     try:
         if not WHISPER_AVAILABLE:
-            return "❌ Whisper is not installed. Run: pip install openai-whisper", ""
         if not url:
             return "❌ YouTube URL required", ""
@@ -133,22 +127,24 @@ def run_pipeline(url, cookies_file):
             return transcript, ""
         stock_info = extract_stock_info(transcript)
-        return "✅ Complete", stock_info
     except Exception as e:
         tb = traceback.format_exc()
         print(tb)
         return f"❌ Unhandled Error:\n{tb}", ""
-# ✅ Audio file upload pipeline
-def run_pipeline_audio(audio_file):
     try:
         if not WHISPER_AVAILABLE:
-            return "❌ Whisper is not installed. Run: pip install openai-whisper", ""
         if audio_file is None:
             return "❌ No audio file uploaded", ""
-        # Handle both file-like and NamedString (path string)
         temp_audio_path = tempfile.mktemp(suffix=os.path.splitext(str(audio_file))[-1])
         if hasattr(audio_file, "read"):
             with open(temp_audio_path, "wb") as f:
@@ -161,35 +157,40 @@ def run_pipeline_audio(audio_file):
             return transcript, ""
         stock_info = extract_stock_info(transcript)
-        return "✅ Complete", stock_info
     except Exception as e:
         tb = traceback.format_exc()
         print(tb)
         return f"❌ Unhandled Error:\n{tb}", ""
-# ✅ Gradio UI
 with gr.Blocks(title="Stock Insights from YouTube or Audio") as demo:
     gr.Markdown("""
-    # 🎧 Extract Stock Recommendations from YouTube or Uploaded Audio
-    Upload a YouTube URL or an audio file. We'll transcribe it and extract stock-related insights!
     """)
     with gr.Tab("📺 From YouTube Video"):
         with gr.Row():
-            url_input = gr.Textbox(label="🎥 YouTube Video URL")
             cookie_input = gr.File(label="cookies.txt (optional)", file_types=[".txt"])
         yt_run_btn = gr.Button("🚀 Extract from YouTube")
         yt_status = gr.Textbox(label="Status")
-        yt_result = gr.Textbox(label="Stock Info", lines=12)
-        yt_run_btn.click(fn=run_pipeline, inputs=[url_input, cookie_input], outputs=[yt_status, yt_result])
     with gr.Tab("🎵 From Uploaded Audio"):
         audio_input = gr.File(label="Upload Audio File", file_types=[".mp3", ".wav", ".m4a", ".webm"])
         audio_run_btn = gr.Button("🚀 Extract from Audio")
         audio_status = gr.Textbox(label="Status")
-        audio_result = gr.Textbox(label="Stock Info", lines=12)
-        audio_run_btn.click(fn=run_pipeline_audio, inputs=[audio_input], outputs=[audio_status, audio_result])
 if __name__ == "__main__":
     demo.launch(debug=True)

 except:
     WHISPER_AVAILABLE = False
+# Download audio from YouTube
 def download_audio(url, cookies_path=None):
     try:
         temp_dir = tempfile.mkdtemp()
             'quiet': True,
             'noplaylist': True,
             'cookiefile': cookies_path if cookies_path else None,
+            'user_agent': 'Mozilla/5.0',
             'referer': 'https://www.youtube.com/',
             'force_ipv4': True,
         }
         with YoutubeDL(ydl_opts) as ydl:
         traceback.print_exc()
         return None, f"❌ Download error: {str(e)}"
+# Transcribe using Whisper
 def transcribe_audio(path):
     if not WHISPER_AVAILABLE:
         return "❌ Whisper not available. Please install openai-whisper."
         traceback.print_exc()
         return f"❌ Transcription failed: {str(e)}"
+# Extract stock insights
 def extract_stock_info(text):
     try:
         companies = re.findall(r'\b[A-Z][a-z]+(?: [A-Z][a-z]+)*\b', text)
         symbols = re.findall(r'\b[A-Z]{2,5}\b', text)
         prices = re.findall(r'\$\d+(?:\.\d{1,2})?', text)
+        actions = re.findall(r'\b(buy|sell|hold|target|bullish|bearish|stop loss|accumulate|short|take profit|entry|exit)\b', text, re.IGNORECASE)
         result = "=== STOCK RECOMMENDATION ANALYSIS ===\n\n"
         if companies:
         recommendations = []
         for line in text.split("."):
+            if any(word in line.lower() for word in ['buy', 'sell', 'target', 'hold', 'accumulate', 'short', 'entry', 'exit']):
                 recommendations.append(line.strip())
         if recommendations:
     except Exception as e:
         return f"❌ Stock info extraction failed: {str(e)}"
+# Save cookies
 def save_cookies(file):
     if file is None:
         return None
         print(f"❌ Failed to handle cookies.txt: {e}")
         return None
+# YouTube flow
+def run_pipeline(url, cookies_file, show_transcript):
     try:
         if not WHISPER_AVAILABLE:
+            return "❌ Whisper not installed", ""
         if not url:
             return "❌ YouTube URL required", ""
             return transcript, ""
         stock_info = extract_stock_info(transcript)
+        if show_transcript:
+            return "✅ Complete", f"📜 Transcript:\n\n{transcript}\n\n\n{stock_info}"
+        else:
+            return "✅ Complete", stock_info
     except Exception as e:
         tb = traceback.format_exc()
         print(tb)
         return f"❌ Unhandled Error:\n{tb}", ""
+# Audio upload flow
+def run_pipeline_audio(audio_file, show_transcript):
     try:
         if not WHISPER_AVAILABLE:
+            return "❌ Whisper not installed", ""
         if audio_file is None:
             return "❌ No audio file uploaded", ""
         temp_audio_path = tempfile.mktemp(suffix=os.path.splitext(str(audio_file))[-1])
         if hasattr(audio_file, "read"):
             with open(temp_audio_path, "wb") as f:
             return transcript, ""
         stock_info = extract_stock_info(transcript)
+        if show_transcript:
+            return "✅ Complete", f"📜 Transcript:\n\n{transcript}\n\n\n{stock_info}"
+        else:
+            return "✅ Complete", stock_info
     except Exception as e:
         tb = traceback.format_exc()
         print(tb)
         return f"❌ Unhandled Error:\n{tb}", ""
+# Gradio UI
 with gr.Blocks(title="Stock Insights from YouTube or Audio") as demo:
     gr.Markdown("""
+    # 📈 Extract Stock Recommendations from YouTube or Uploaded Audio
+    Upload a YouTube video or audio file. We'll transcribe it using Whisper and extract stock insights.
     """)
     with gr.Tab("📺 From YouTube Video"):
         with gr.Row():
+            url_input = gr.Textbox(label="🎥 YouTube URL")
             cookie_input = gr.File(label="cookies.txt (optional)", file_types=[".txt"])
+        show_transcript_yt = gr.Checkbox(label="Show Transcript", value=False)
         yt_run_btn = gr.Button("🚀 Extract from YouTube")
         yt_status = gr.Textbox(label="Status")
+        yt_result = gr.Textbox(label="Transcript & Stock Info", lines=15)
+        yt_run_btn.click(fn=run_pipeline, inputs=[url_input, cookie_input, show_transcript_yt], outputs=[yt_status, yt_result])
     with gr.Tab("🎵 From Uploaded Audio"):
         audio_input = gr.File(label="Upload Audio File", file_types=[".mp3", ".wav", ".m4a", ".webm"])
+        show_transcript_audio = gr.Checkbox(label="Show Transcript", value=False)
         audio_run_btn = gr.Button("🚀 Extract from Audio")
         audio_status = gr.Textbox(label="Status")
+        audio_result = gr.Textbox(label="Transcript & Stock Info", lines=15)
+        audio_run_btn.click(fn=run_pipeline_audio, inputs=[audio_input, show_transcript_audio], outputs=[audio_status, audio_result])
 if __name__ == "__main__":
     demo.launch(debug=True)