YTB-TEST

Running

App Files Community

fantaxy committed on Jun 19

Commit

86335a9

verified ·

1 Parent(s): 9dd9c8e

Update app.py

Browse files

Files changed (1) hide show

app.py +0 -1131

app.py CHANGED Viewed

@@ -1,1137 +1,6 @@
 #!/usr/bin/env python3
 """
 YouTube Video Analyzer & Downloader Pro
-(쿠키 자동 처리 버전)
-· `www.youtube.com_cookies.txt` 파일이 **app.py**와 같은 폴더에 있으면
-  자동으로 사용합니다.
-· Gradio UI에서 쿠키 파일을 업로드하면, 업로드된 파일이 **우선** 적용됩니다.
-"""
-# ──────────────────────────────────────────────────────────────
-# 표준 라이브러리
-# ──────────────────────────────────────────────────────────────
-import os
-import re
-import json
-import uuid
-import shutil
-import tempfile
-from datetime import datetime
-from pathlib import Path
-# ──────────────────────────────────────────────────────────────
-# 외부 라이브러리
-# ──────────────────────────────────────────────────────────────
-import gradio as gr
-import yt_dlp
-import google.generativeai as genai
-# ───────── transcript_utils.py ─────────
-from youtube_transcript_api import YouTubeTranscriptApi
-from datetime import timedelta
def fetch_transcript(video_id, lang_pref=("ko","en")):
    """Return a video's transcript as Markdown lines prefixed with timestamps.

    Each language in ``lang_pref`` is tried in order and the first transcript
    that can be fetched is used.

    Args:
        video_id: YouTube video ID passed to ``YouTubeTranscriptApi``.
        lang_pref: Language codes to try, in priority order.

    Returns:
        One line per transcript segment, joined with newlines, formatted as
        ``**[MM:SS]** text`` (``**[H:MM:SS]** text`` from one hour onwards).

    Raises:
        RuntimeError: If no transcript is available in any preferred language.
    """
    transcript = None
    for lang in lang_pref:
        try:
            transcript = YouTubeTranscriptApi.get_transcript(video_id, languages=[lang])
            break
        except Exception:
            # Any failure for this language simply moves on to the next one.
            continue
    if transcript is None:
        raise RuntimeError("자막을 찾을 수 없습니다.")
    lines = []
    for seg in transcript:
        hours, remainder = divmod(int(seg["start"]), 3600)
        minutes, seconds = divmod(remainder, 60)
        # Keep the hour once it is non-zero; dropping it made 1:01:23 and
        # 0:01:23 render as the same "01:23" stamp.
        if hours:
            stamp = f"{hours}:{minutes:02d}:{seconds:02d}"
        else:
            stamp = f"{minutes:02d}:{seconds:02d}"
        lines.append(f"**[{stamp}]** {seg['text']}")
    return "\n".join(lines)
-# ──────────────────────────────────────────────────────────────
# Default cookie file path: used automatically when a file with this exact
# name sits in the same folder as this module.
# ──────────────────────────────────────────────────────────────
DEFAULT_COOKIE_FILE = Path(__file__).with_name("www.youtube.com_cookies.txt")
-# =================================================================
-# Main Class
-# =================================================================
-class YouTubeDownloader:
-    def __init__(self):
-        # 임시 디렉터리 (Gradio 호환)
-        self.download_dir = tempfile.mkdtemp()
-        self.temp_downloads = tempfile.mkdtemp(prefix="youtube_downloads_")
-        # 사용자 Downloads 하위 폴더
-        self.downloads_folder = os.path.join(
-            os.path.expanduser("~"), "Downloads", "YouTube_Downloads"
-        )
-        os.makedirs(self.downloads_folder, exist_ok=True)
-        self.gemini_model = None
-    # ---------------------------------------------------------
-    # Google Gemini API
-    # ---------------------------------------------------------
-    def configure_gemini(self, api_key):
-        try:
-            genai.configure(api_key=api_key)
-            self.gemini_model = genai.GenerativeModel(
-                model_name="gemini-1.5-flash-latest"
-            )
-            return True, "✅ Gemini API configured successfully!"
-        except Exception as e:
-            return False, f"❌ Failed to configure Gemini API: {e}"
-    # ---------------------------------------------------------
-    # 임시 디렉터리 정리
-    # ---------------------------------------------------------
-    def cleanup(self):
-        try:
-            if hasattr(self, "download_dir") and os.path.exists(self.download_dir):
-                shutil.rmtree(self.download_dir)
-            if hasattr(self, "temp_downloads") and os.path.exists(self.temp_downloads):
-                shutil.rmtree(self.temp_downloads)
-        except Exception as e:
-            print(f"⚠️ Warning: Could not clean up temporary directory: {e}")
-    # ---------------------------------------------------------
-    # 유튜브 URL 검증
-    # ---------------------------------------------------------
-    def is_valid_youtube_url(self, url):
-        youtube_regex = re.compile(
-            r"(https?://)?(www\.)?"
-            r"(youtube|youtu|youtube-nocookie)\.(com|be)/"
-            r"(watch\?v=|embed/|v/|.+\?v=)?([^&=%\?]{11})"
-        )
-        return youtube_regex.match(url) is not None
-    # ---------------------------------------------------------
-    # Gemini-AI 장면 분석
-    # ---------------------------------------------------------
-    def generate_scene_breakdown_gemini(self, video_info):
-        if not self.gemini_model:
-            return self.generate_scene_breakdown_fallback(video_info)
-        try:
-            duration = video_info.get("duration", 0)
-            title = video_info.get("title", "")
-            description = video_info.get("description", "")[:1500]
-            if not duration:
-                return [
-                    "**[Duration Unknown]**: Unable to generate timestamped breakdown - "
-                    "video duration not available"
-                ]
-            prompt = f"""
-Analyze this YouTube video and create a highly detailed, scene-by-scene breakdown
-with precise timestamps and specific descriptions:
-Title: {title}
-Duration: {duration} seconds
-Description: {description}
-IMPORTANT INSTRUCTIONS:
-1. Create detailed scene descriptions that include:
-   - Physical appearance of people (age, gender, clothing, hair, etc.)
-   - Exact actions being performed
-   - Dialogue or speech (include actual lines if audible, or infer probable spoken
-     lines based on actions and setting; format them as "Character: line…")
-   - Setting and environment details
-   - Props, objects, or products being shown
-   - Visual effects, text overlays, or graphics
-   - Mood, tone, and atmosphere
-   - Camera movements or angles (if apparent)
-2. Dialogue Emphasis:
-   - Include short dialogue lines in **every scene** wherever plausible.
-   - Write lines like: Character: "Actual or inferred line…"
-   - If dialogue is not available, intelligently infer probable phrases
-     (e.g., "Welcome!", "Try this now!", "It feels amazing!").
-3. Timestamp Guidelines:
-   - For videos under 1 minute: 2-3 second segments
-   - For videos 1-5 minutes: 3-5 second segments
-   - For videos 5-15 minutes: 5-10 second segments
-   - For videos over 15 minutes: 10-15 second segments
-   - Maximum 20 scenes total for longer videos
-4. Format each scene EXACTLY like this:
-   **[MM:SS-MM:SS]**: Detailed description…
-5. Write descriptions as if you're watching the video in real-time,
-   noting everything visible and audible.
-"""
-            response = self.gemini_model.generate_content(prompt)
-            if response and response.text:
-                scenes = []
-                lines = response.text.split("\n")
-                current_scene = ""
-                for line in lines:
-                    line = line.strip()
-                    if line.startswith("**[") and "]**:" in line:
-                        if current_scene:
-                            scenes.append(current_scene.strip())
-                        current_scene = line
-                    elif current_scene:
-                        current_scene += "\n" + line
-                if current_scene:
-                    scenes.append(current_scene.strip())
-                return (
-                    scenes if scenes else self.generate_scene_breakdown_fallback(video_info)
-                )
-            return self.generate_scene_breakdown_fallback(video_info)
-        except Exception as e:
-            print(f"Gemini API error: {e}")
-            return self.generate_scene_breakdown_fallback(video_info)
-    # ---------------------------------------------------------
-    # Fallback 장면 분석
-    # ---------------------------------------------------------
-    def generate_scene_breakdown_fallback(self, video_info):
-        duration = video_info.get("duration", 0)
-        title = video_info.get("title", "").lower()
-        description = video_info.get("description", "").lower()
-        uploader = video_info.get("uploader", "Content creator")
-        if not duration:
-            return ["**[Duration Unknown]**: Unable to generate timestamped breakdown"]
-        if duration <= 60:
-            segment_length = 3
-        elif duration <= 300:
-            segment_length = 5
-        elif duration <= 900:
-            segment_length = 10
-        else:
-            segment_length = 15
-        scenes = []
-        num_segments = min(duration // segment_length + 1, 20)
-        video_type = self.detect_video_type_detailed(title, description)
-        for i in range(num_segments):
-            start_time = i * segment_length
-            end_time = min(start_time + segment_length - 1, duration)
-            start_fmt = f"{start_time//60}:{start_time%60:02d}"
-            end_fmt = f"{end_time//60}:{end_time%60:02d}"
-            desc = self.generate_contextual_description(
-                i, num_segments, video_type, uploader, title
-            )
-            scenes.append(f"**[{start_fmt}-{end_fmt}]**: {desc}")
-        return scenes
-    # ---------------------------------------------------------
-    # 비디오 유형 감지(상세)
-    # ---------------------------------------------------------
-    def detect_video_type_detailed(self, title, description):
-        text = (title + " " + description).lower()
-        if any(w in text for w in ["tutorial", "how to", "guide", "learn", "diy"]):
-            return "tutorial"
-        if any(w in text for w in ["review", "unboxing", "test", "comparison", "vs"]):
-            return "review"
-        if any(w in text for w in ["vlog", "daily", "routine", "day in"]):
-            return "vlog"
-        if any(w in text for w in ["music", "song", "cover", "lyrics"]):
-            return "music"
-        if any(w in text for w in ["comedy", "funny", "prank", "challenge"]):
-            return "entertainment"
-        if any(w in text for w in ["news", "breaking", "update", "report"]):
-            return "news"
-        if any(w in text for w in ["cooking", "recipe", "food", "kitchen"]):
-            return "cooking"
-        if any(w in text for w in ["workout", "fitness", "exercise", "yoga"]):
-            return "fitness"
-        return "general"
-    # ---------------------------------------------------------
-    # 장면별 설명 생성
-    # ---------------------------------------------------------
-    def generate_contextual_description(
-        self, scene_index, total_scenes, video_type, uploader, title
-    ):
-        presenter_desc = "The content creator"
-        if "woman" in title or "girl" in title:
-            presenter_desc = "A woman"
-        elif "man" in title or "guy" in title:
-            presenter_desc = "A man"
-        if scene_index == 0:
-            if video_type == "tutorial":
-                return (
-                    f"{presenter_desc} appears on screen, introducing themselves and the "
-                    f"topic. They are in a well-lit workspace, wearing casual clothes."
-                )
-            if video_type == "vlog":
-                return (
-                    f"{presenter_desc} greets the camera cheerfully, perhaps waving, and "
-                    f"explains what today's vlog is about."
-                )
-            if video_type == "review":
-                return (
-                    f"{presenter_desc} holds up the product to be reviewed, giving a brief "
-                    f"overview of its features."
-                )
-            return (
-                f"{presenter_desc} starts the video with an engaging introduction to "
-                f"capture viewers' attention."
-            )
-        if scene_index == total_scenes - 1:
-            if video_type == "tutorial":
-                return (
-                    f"{presenter_desc} shows the final result, thanks viewers, and "
-                    f"encourages them to like and subscribe."
-                )
-            if video_type == "vlog":
-                return (
-                    f"{presenter_desc} wraps up the day, sharing final thoughts and "
-                    f"bidding farewell."
-                )
-            return (
-                f"{presenter_desc} concludes, summarizing key points and prompting "
-                f"engagement through likes and comments."
-            )
-        if video_type == "tutorial":
-            return (
-                f"{presenter_desc} demonstrates the next step, providing clear "
-                f"instructions with close-up shots."
-            )
-        if video_type == "review":
-            return (
-                f"{presenter_desc} examines a specific feature of the product, showing "
-                f"it in use and commenting on performance."
-            )
-        if video_type == "vlog":
-            return (
-                f"{presenter_desc} continues the day's activities, sharing candid "
-                f"moments and personal reflections."
-            )
-        if video_type == "cooking":
-            return (
-                f"{presenter_desc} prepares ingredients, chopping and mixing while "
-                f"explaining each step."
-            )
-        if video_type == "fitness":
-            return (
-                f"{presenter_desc} performs an exercise set, demonstrating proper form "
-                f"and offering tips."
-            )
-        return (
-            f"{presenter_desc} proceeds with the main content, engaging viewers through "
-            f"clear explanations."
-        )
-    # ---------------------------------------------------------
-    # 비디오 유형 (간략)
-    # ---------------------------------------------------------
-    def detect_video_type(self, title, description):
-        text = (title + " " + description).lower()
-        if any(w in text for w in ["music", "song", "album", "artist", "band", "lyrics"]):
-            return "🎵 Music Video"
-        if any(w in text for w in ["tutorial", "how to", "guide", "learn"]):
-            return "📚 Tutorial/Educational"
-        if any(w in text for w in ["funny", "comedy", "entertainment", "vlog"]):
-            return "🎭 Entertainment/Comedy"
-        if any(w in text for w in ["news", "breaking", "report", "update"]):
-            return "📰 News/Information"
-        if any(w in text for w in ["review", "unboxing", "test", "comparison"]):
-            return "⭐ Review/Unboxing"
-        if any(w in text for w in ["commercial", "ad", "brand", "product"]):
-            return "📺 Commercial/Advertisement"
-        return "🎬 General Content"
-    # ---------------------------------------------------------
-    # 배경 음악 추정
-    # ---------------------------------------------------------
-    def detect_background_music(self, video_info):
-        title = video_info.get("title", "").lower()
-        if "music" in title or "song" in title:
-            return "🎵 Original Music/Soundtrack"
-        if "commercial" in title or "ad" in title:
-            return "🎶 Upbeat Commercial Music"
-        if "tutorial" in title or "how to" in title:
-            return "🔇 Minimal/No Background Music"
-        if "vlog" in title or "daily" in title:
-            return "🎼 Ambient Background Music"
-        return "🎵 Background Music"
-    # ---------------------------------------------------------
-    # 인플루언서 규모 추정
-    # ---------------------------------------------------------
-    def detect_influencer_status(self, video_info):
-        subs = video_info.get("channel_followers", 0)
-        views = video_info.get("view_count", 0)
-        if subs > 10_000_000:
-            return "🌟 Mega Influencer (10M+)"
-        if subs > 1_000_000:
-            return "⭐ Major Influencer (1M+)"
-        if subs > 100_000:
-            return "🎯 Mid-tier Influencer (100K+)"
-        if subs > 10_000:
-            return "📈 Micro Influencer (10K+)"
-        if views > 100_000:
-            return "🔥 Viral Content Creator"
-        return "👤 Regular Content Creator"
-    # ---------------------------------------------------------
-    # 숫자 포맷터
-    # ---------------------------------------------------------
-    def format_number(self, num):
-        if not num:
-            return "0"
-        if num >= 1_000_000_000:
-            return f"{num/1_000_000_000:.1f}B"
-        if num >= 1_000_000:
-            return f"{num/1_000_000:.1f}M"
-        if num >= 1_000:
-            return f"{num/1_000:.1f}K"
-        return str(num)
-    # ---------------------------------------------------------
-    # 최종 리포트 생성
-    # ---------------------------------------------------------
-    def format_video_info(self, video_info):
-        if not video_info:
-            return "❌ No video information available."
-        title = video_info.get("title", "Unknown")
-        uploader = video_info.get("uploader", "Unknown")
-        duration = video_info.get("duration", 0)
-        dur_str = f"{duration//60}:{duration%60:02d}" if duration else "Unknown"
-        views = video_info.get("view_count", 0)
-        likes = video_info.get("like_count", 0)
-        comments = video_info.get("comment_count", 0)
-        upload_date = video_info.get("upload_date", "Unknown")
-        if len(upload_date) == 8:
-            upload_date = f"{upload_date[:4]}-{upload_date[4:6]}-{upload_date[6:8]}"
-        scenes = self.generate_scene_breakdown_gemini(video_info)
-        vtype = self.detect_video_type(title, video_info.get("description", ""))
-        bgm = self.detect_background_music(video_info)
-        creator = self.detect_influencer_status(video_info)
-        engagement = (likes / views) * 100 if views else 0
-        report = f"""
-🎬 YOUTUBE VIDEO ANALYSIS REPORT
-{'='*50}
-📋 BASIC INFORMATION
-{'─'*25}
-📹 **Title:** {title}
-👤 **Uploader:** {uploader}
-📅 **Upload Date:** {upload_date}
-⏱️ **Duration:** {dur_str}
-🆔 **Video ID:** {video_info.get('id', 'Unknown')}
-📊 PERFORMANCE METRICS
-{'─'*25}
-👀 **Views:** {self.format_number(views)} ({views:,})
-👍 **Likes:** {self.format_number(likes)} ({likes:,})
-💬 **Comments:** {self.format_number(comments)} ({comments:,})
-📈 **Engagement Rate:** {engagement:.2f}%
-🎯 CONTENT ANALYSIS
-{'─'*25}
-📂 **Video Type:** {vtype}
-🎵 **Background Music:** {bgm}
-👑 **Creator Status:** {creator}
-🎬 DETAILED SCENE BREAKDOWN
-{'─'*30}
-{chr(10).join(scenes)}
-📝 DESCRIPTION PREVIEW
-{'─'*25}
-{video_info.get('description', 'No description available')[:500]}
-{'...(truncated)' if len(video_info.get('description', '')) > 500 else ''}
-{'='*50}
-📊 **Analysis completed:** {datetime.now().strftime('%Y-%m-%d %H:%M:%S')}
-🤖 **AI Enhancement:** {'Gemini AI' if self.gemini_model else 'Standard Analysis'}
-"""
-        return report.strip()
-    # ---------------------------------------------------------
-    # 메타데이터 추출
-    # ---------------------------------------------------------
-    def get_video_info(self, url, progress=gr.Progress(), cookiefile=None):
-        if not url or not url.strip():
-            return None, "❌ Please enter a YouTube URL"
-        if not self.is_valid_youtube_url(url):
-            return None, "❌ Invalid YouTube URL format"
-        # 쿠키 선택 순서: UI 업로드 → 기본 쿠키 → None
-        if cookiefile and os.path.exists(cookiefile):
-            cookiefile = cookiefile
-        elif DEFAULT_COOKIE_FILE.exists():
-            cookiefile = str(DEFAULT_COOKIE_FILE)
-        else:
-            cookiefile = None
-        try:
-            progress(0.1, desc="Initializing YouTube extractor…")
-            ydl_opts = {"noplaylist": True, "extract_flat": False}
-            if cookiefile:
-                ydl_opts["cookiefile"] = cookiefile
-            progress(0.5, desc="Extracting video metadata…")
-            with yt_dlp.YoutubeDL(ydl_opts) as ydl:
-                info = ydl.extract_info(url, download=False)
-            progress(1.0, desc="✅ Analysis complete!")
-            return info, "✅ Video information extracted successfully"
-        except Exception as e:
-            return None, f"❌ Error: {e}"
-    # ---------------------------------------------------------
-    # 다운로드
-    # ---------------------------------------------------------
-    def download_video(
-        self,
-        url,
-        quality="best",
-        audio_only=False,
-        progress=gr.Progress(),
-        cookiefile=None,
-    ):
-        if not url or not url.strip():
-            return None, "❌ Please enter a YouTube URL"
-        if not self.is_valid_youtube_url(url):
-            return None, "❌ Invalid YouTube URL format"
-        # 쿠키 선택 순서
-        if cookiefile and os.path.exists(cookiefile):
-            cookiefile = cookiefile
-        elif DEFAULT_COOKIE_FILE.exists():
-            cookiefile = str(DEFAULT_COOKIE_FILE)
-        else:
-            cookiefile = None
-        try:
-            progress(0.1, desc="Preparing download…")
-            timestamp = datetime.now().strftime("%Y%m%d_%H%M%S")
-            ydl_opts = {
-                "outtmpl": os.path.join(
-                    self.temp_downloads, f"%(title)s_{timestamp}.%(ext)s"
-                ),
-                "noplaylist": True,
-            }
-            if audio_only:
-                ydl_opts["format"] = "bestaudio/best"
-                ydl_opts["postprocessors"] = [
-                    {
-                        "key": "FFmpegExtractAudio",
-                        "preferredcodec": "mp3",
-                        "preferredquality": "192",
-                    }
-                ]
-            else:
-                if quality == "720p":
-                    ydl_opts["format"] = "best[height<=720]"
-                elif quality == "480p":
-                    ydl_opts["format"] = "best[height<=480]"
-                else:  # "best"
-                    ydl_opts["format"] = "best[height<=1080]"
-            if cookiefile:
-                ydl_opts["cookiefile"] = cookiefile
-            # 진행률 훅
-            def hook(d):
-                if d["status"] == "downloading":
-                    if "total_bytes" in d:
-                        pct = d["downloaded_bytes"] / d["total_bytes"] * 100
-                        progress(0.1 + pct / 100 * 0.7, desc=f"Downloading… {pct:.1f}%")
-                    else:
-                        progress(0.5, desc="Downloading…")
-                elif d["status"] == "finished":
-                    progress(0.8, desc="Processing download…")
-            ydl_opts["progress_hooks"] = [hook]
-            with yt_dlp.YoutubeDL(ydl_opts) as ydl:
-                ydl.extract_info(url, download=True)
-            progress(0.9, desc="Copying to Downloads folder…")
-            # temp 디렉터리에서 파일 찾기
-            downloaded_temp = None
-            for f in os.listdir(self.temp_downloads):
-                if timestamp in f:
-                    downloaded_temp = os.path.join(self.temp_downloads, f)
-                    break
-            if not downloaded_temp:
-                return None, "❌ Downloaded file not found"
-            final_name = os.path.basename(downloaded_temp)
-            final_path = os.path.join(self.downloads_folder, final_name)
-            try:
-                shutil.copy2(downloaded_temp, final_path)
-                saved = True
-            except Exception as e:
-                print(f"Copy warning: {e}")
-                saved = False
-                final_path = "File kept only in temp folder"
-            progress(1.0, desc="✅ Download complete!")
-            msg = (
-                "✅ Download successful!\n"
-                f"📁 Temp file: {os.path.basename(downloaded_temp)}\n"
-                f"📁 Saved to: {final_path if saved else 'Copy failed'}\n"
-                f"🎯 Size: {os.path.getsize(downloaded_temp)/(1024*1024):.1f} MB"
-            )
-            return downloaded_temp, msg
-        except Exception as e:
-            return None, f"❌ Download failed: {e}"
-# =================================================================
-# Helper functions for Gradio
-# =================================================================
# Shared module-level instance used by the Gradio callback helpers below.
downloader = YouTubeDownloader()
def configure_api_key(api_key):
    """Gradio callback: configure Gemini with the key the user entered.

    Returns:
        A status message and a ``gr.update`` whose ``visible`` flag is True
        only when configuration succeeded.
    """
    key = api_key.strip() if api_key else ""
    if not key:
        return "❌ Please enter a valid Google API key", gr.update(visible=False)
    succeeded, message = downloader.configure_gemini(key)
    return message, gr.update(visible=succeeded)
def analyze_with_cookies(url, cookies_file, progress=gr.Progress()):
    """Gradio callback: fetch metadata for ``url`` and return the report text.

    ``cookies_file`` is forwarded as the cookie file when truthy. Any failure
    is returned as an error string rather than raised.
    """
    try:
        progress(0.05, desc="Starting analysis…")
        info, msg = downloader.get_video_info(
            url, progress=progress, cookiefile=cookies_file or None
        )
        if not info:
            return f"❌ Analysis Failed: {msg}"
        progress(0.95, desc="Generating report…")
        return downloader.format_video_info(info)
    except Exception as e:
        return f"❌ System Error: {e}"
def download_with_cookies(url, quality, audio_only, cookies_file, progress=gr.Progress()):
    """Gradio callback: download ``url`` and return ``(file_path, status)``.

    ``file_path`` is ``None`` whenever the download did not produce a file;
    unexpected errors are reported in the status text rather than raised.
    """
    try:
        progress(0.05, desc="Preparing download…")
        file_path, status = downloader.download_video(
            url,
            quality,
            audio_only,
            progress=progress,
            cookiefile=cookies_file or None,
        )
        if not file_path:
            return None, status
        return file_path, status
    except Exception as e:
        return None, f"❌ System Error: {e}"
-# =================================================================
-# Gradio UI
-# =================================================================
-#!/usr/bin/env python3
-"""
-YouTube Video Analyzer & Downloader Pro
-───────────────────────────────────────
-•  `www.youtube.com_cookies.txt` 가 app.py 와 같은 폴더에 있으면 자동으로 사용
-•  UI에서 쿠키를 업로드하면 그 파일이 *우선* 적용
-•  “Transcript” 탭을 추가해 **전체 자막 + MM:SS 타임스탬프** 출력
-"""
-# ── 표준 라이브러리 ───────────────────────────────────────────
-import os, re, json, shutil, tempfile
-from datetime import datetime, timedelta
-from pathlib import Path
-# ── 서드파티 ──────────────────────────────────────────────────
-import gradio as gr
-import yt_dlp
-import google.generativeai as genai
-from youtube_transcript_api import YouTubeTranscriptApi  # NEW
# ── Constants ─────────────────────────────────────────────────
DEFAULT_COOKIE_FILE = Path(__file__).with_name("www.youtube.com_cookies.txt")
# YouTube URL regex (capture group 6 is the video ID)
_YT_REGEX = re.compile(
    r"(https?://)?(www\.)?"
    r"(youtube|youtu|youtube-nocookie)\.(com|be)/"
    r"(watch\?v=|embed/|v/|.+\?v=)?([^&=%\?]{11})"
)
-# =================================================================
-# Helper :  video-ID 추출 + 자막 가져오기
-# =================================================================
-def extract_video_id(url: str) -> str | None:
-    """유튜브 URL에서 11-글자 비디오 ID 반환(없으면 None)"""
-    m = _YT_REGEX.match(url)
-    return m.group(6) if m else None
def fetch_transcript(video_id: str, pref_lang=("ko", "en")) -> str:
    """Fetch a video's transcript and return it as timestamped Markdown lines.

    Languages in ``pref_lang`` are tried in order. If none succeeds, one more
    request is made without a language filter, and any exception from that
    final request propagates to the caller.

    Returns:
        One ``**[MM:SS]** text`` line per segment (``**[H:MM:SS]** text`` from
        one hour onwards), joined with newlines.
    """
    transcript = None
    # Try the preferred languages in priority order.
    for lang in pref_lang:
        try:
            transcript = YouTubeTranscriptApi.get_transcript(video_id, languages=[lang])
            break
        except Exception:
            continue
    # Still nothing: retry without a language filter.
    if transcript is None:
        transcript = YouTubeTranscriptApi.get_transcript(video_id)
    lines = []
    for seg in transcript:
        hours, remainder = divmod(int(seg["start"]), 3600)
        minutes, seconds = divmod(remainder, 60)
        # Keep the hour once it is non-zero; dropping it made 1:01:23 and
        # 0:01:23 render as the same "01:23" stamp.
        if hours:
            stamp = f"{hours}:{minutes:02d}:{seconds:02d}"
        else:
            stamp = f"{minutes:02d}:{seconds:02d}"
        lines.append(f"**[{stamp}]** {seg['text']}")
    return "\n".join(lines)
-# =================================================================
-# 메인 클래스
-# =================================================================
-class YouTubeDownloader:
-    def __init__(self):
-        self.download_dir = tempfile.mkdtemp()
-        self.temp_downloads = tempfile.mkdtemp(prefix="youtube_downloads_")
-        self.downloads_folder = os.path.join(
-            os.path.expanduser("~"), "Downloads", "YouTube_Downloads"
-        )
-        os.makedirs(self.downloads_folder, exist_ok=True)
-        self.gemini_model = None
-    # ───────── Gemini ─────────
-    def configure_gemini(self, api_key):
-        try:
-            genai.configure(api_key=api_key)
-            self.gemini_model = genai.GenerativeModel(
-                model_name="gemini-1.5-flash-latest"
-            )
-            return True, "✅ Gemini API configured successfully!"
-        except Exception as e:
-            return False, f"❌ Failed to configure Gemini API: {e}"
-    # ───────── 정리 ────���────
-    def cleanup(self):
-        try:
-            if os.path.exists(self.download_dir):
-                shutil.rmtree(self.download_dir)
-            if os.path.exists(self.temp_downloads):
-                shutil.rmtree(self.temp_downloads)
-        except Exception:
-            pass
-    # ───────── URL 검증 ──────
-    def is_valid_youtube_url(self, url):
-        return _YT_REGEX.match(url) is not None
-    # ───────── Gemini scene breakdown (생략 없이 전체 구현) ──────
-    def generate_scene_breakdown_gemini(self, video_info):
-        if not self.gemini_model:
-            return self.generate_scene_breakdown_fallback(video_info)
-        try:
-            duration = video_info.get("duration", 0)
-            title = video_info.get("title", "")
-            description = video_info.get("description", "")[:1500]
-            if not duration:
-                return [
-                    "**[Duration Unknown]**: Unable to generate timestamped breakdown – "
-                    "video duration not available"
-                ]
-            prompt = f"""
-Analyze this YouTube video and create a highly detailed, scene-by-scene breakdown
-with precise timestamps and specific descriptions:
-Title: {title}
-Duration: {duration} seconds
-Description: {description}
-IMPORTANT INSTRUCTIONS:
-1. Create detailed scene descriptions that include:
-   - Physical appearance of people (age, gender, clothing, hair, etc.)
-   - Exact actions being performed
-   - Dialogue or speech (include actual lines if audible, or infer probable spoken
-     lines based on actions and setting; format them as "Character: line…")
-   - Setting and environment details
-   - Props, objects, or products being shown
-   - Visual effects, text overlays, or graphics
-   - Mood, tone, and atmosphere
-   - Camera movements or angles (if apparent)
-2. Dialogue Emphasis:
-   - Include short dialogue lines in **every scene** wherever plausible.
-   - Write lines like: Character: "Actual or inferred line…"
-   - If dialogue is not available, intelligently infer probable phrases
-3. Timestamp Guidelines:
-   - <1 min : 2–3 s | 1–5 min : 3–5 s | 5–15 min : 5–10 s | >15 min : 10–15 s
-   - Max 20 scenes
-4. Format: **[MM:SS-MM:SS]** description
-"""
-            resp = self.gemini_model.generate_content(prompt)
-            if not resp or not resp.text:
-                return self.generate_scene_breakdown_fallback(video_info)
-            scenes, cur = [], ""
-            for line in resp.text.splitlines():
-                line = line.strip()
-                if line.startswith("**[") and "]**:" in line:
-                    if cur:
-                        scenes.append(cur.strip())
-                    cur = line
-                elif cur:
-                    cur += "\n" + line
-            if cur:
-                scenes.append(cur.strip())
-            return scenes if scenes else self.generate_scene_breakdown_fallback(video_info)
-        except Exception:
-            return self.generate_scene_breakdown_fallback(video_info)
-    # ───────── fallback breakdown ──────
-    def generate_scene_breakdown_fallback(self, video_info):
-        duration = video_info.get("duration", 0)
-        if not duration:
-            return ["**[Duration Unknown]**: Unable to generate timestamped breakdown"]
-        if duration <= 60:
-            seg = 3
-        elif duration <= 300:
-            seg = 5
-        elif duration <= 900:
-            seg = 10
-        else:
-            seg = 15
-        total = min(duration // seg + 1, 20)
-        vtype = self.detect_video_type_detailed(
-            video_info.get("title", ""), video_info.get("description", "")
-        )
-        scenes = []
-        for i in range(total):
-            s, e = i * seg, min(i * seg + seg - 1, duration)
-            scenes.append(
-                f"**[{s//60:02d}:{s%60:02d}-{e//60:02d}:{e%60:02d}]**: "
-                f"{self.generate_contextual_description(i, total, vtype, '', video_info.get('title',''))}"
-            )
-        return scenes
-    # ───────── detect helpers (detailed) ──────
-    def detect_video_type_detailed(self, title, desc):
-        t = (title + " " + desc).lower()
-        if any(x in t for x in ["tutorial", "how to", "guide", "diy"]):
-            return "tutorial"
-        if any(x in t for x in ["review", "unboxing", "comparison"]):
-            return "review"
-        if any(x in t for x in ["vlog", "daily", "routine"]):
-            return "vlog"
-        if any(x in t for x in ["music", "song", "cover"]):
-            return "music"
-        if any(x in t for x in ["comedy", "prank", "challenge"]):
-            return "entertainment"
-        if any(x in t for x in ["news", "update", "report"]):
-            return "news"
-        if any(x in t for x in ["cooking", "recipe", "food"]):
-            return "cooking"
-        if any(x in t for x in ["workout", "fitness", "yoga"]):
-            return "fitness"
-        return "general"
-    def generate_contextual_description(
-        self, idx, total, vtype, uploader, title
-    ):
-        if idx == 0:
-            return "The creator greets viewers and introduces the video."
-        if idx == total - 1:
-            return "The creator wraps up and thanks viewers."
-        return "Content continues according to the video type."
-    # ───────── quick-detect helpers (summary) ──────
-    def detect_video_type(self, title, desc):
-        t = (title + " " + desc).lower()
-        if any(x in t for x in ["music", "song", "album"]):
-            return "🎵 Music"
-        if any(x in t for x in ["tutorial", "guide"]):
-            return "📚 Tutorial"
-        if any(x in t for x in ["comedy", "vlog"]):
-            return "🎭 Entertainment"
-        if any(x in t for x in ["news", "report"]):
-            return "📰 News"
-        if any(x in t for x in ["review", "unboxing"]):
-            return "⭐ Review"
-        return "🎬 General"
-    def detect_background_music(self, video_info):
-        title = video_info.get("title", "").lower()
-        if "music" in title:
-            return "🎵 Original music"
-        if "tutorial" in title:
-            return "🔇 Minimal music"
-        return "🎼 Background music"
-    def detect_influencer_status(self, video_info):
-        subs = video_info.get("channel_followers", 0)
-        if subs > 10_000_000:
-            return "🌟 Mega (10 M+)"
-        if subs > 1_000_000:
-            return "⭐ Major (1 M+)"
-        if subs > 100_000:
-            return "🎯 Mid (100 K+)"
-        return "👤"
-    @staticmethod
-    def format_number(n):
-        if n >= 1_000_000:
-            return f"{n/1_000_000:.1f} M"
-        if n >= 1_000:
-            return f"{n/1_000:.1f} K"
-        return str(n)
-    # ───────── report ──────
-    def format_video_info(self, info):
-        title = info.get("title", "")
-        uploader = info.get("uploader", "")
-        duration = info.get("duration", 0)
-        dur = f"{duration//60}:{duration%60:02d}"
-        views = info.get("view_count", 0)
-        likes = info.get("like_count", 0)
-        comments = info.get("comment_count", 0)
-        scenes = self.generate_scene_breakdown_gemini(info)
-        return f"""
-🎬 **{title}**
-Uploader: {uploader} Duration: {dur}
-Views / Likes / Comments: {self.format_number(views)} / {self.format_number(likes)} / {self.format_number(comments)}
-{'-'*48}
-{"".join(scenes)}
-"""
-    # ───────── metadata extraction ──────
-    def get_video_info(self, url, progress=gr.Progress(), cookiefile=None):
-        if not self.is_valid_youtube_url(url):
-            return None, "❌ Invalid URL"
-        if cookiefile and os.path.exists(cookiefile):
-            cookiefile = cookiefile
-        elif DEFAULT_COOKIE_FILE.exists():
-            cookiefile = str(DEFAULT_COOKIE_FILE)
-        else:
-            cookiefile = None
-        try:
-            ydl_opts = {"noplaylist": True, "quiet": True}
-            if cookiefile:
-                ydl_opts["cookiefile"] = cookiefile
-            with yt_dlp.YoutubeDL(ydl_opts) as ydl:
-                info = ydl.extract_info(url, download=False)
-            return info, "OK"
-        except Exception as e:
-            return None, f"yt-dlp error: {e}"
-    # ───────── download ──────
-    def download_video(
-        self, url, quality="best", audio_only=False, progress=gr.Progress(), cookiefile=None
-    ):
-        if not self.is_valid_youtube_url(url):
-            return None, "❌ Invalid URL"
-        if cookiefile and os.path.exists(cookiefile):
-            cookiefile = cookiefile
-        elif DEFAULT_COOKIE_FILE.exists():
-            cookiefile = str(DEFAULT_COOKIE_FILE)
-        else:
-            cookiefile = None
-        ts = datetime.now().strftime("%Y%m%d_%H%M%S")
-        ydl_opts = {
-            "outtmpl": os.path.join(self.temp_downloads, f"%(title)s_{ts}.%(ext)s"),
-            "noplaylist": True,
-        }
-        if audio_only:
-            ydl_opts["format"] = "bestaudio/best"
-            ydl_opts["postprocessors"] = [
-                {"key": "FFmpegExtractAudio", "preferredcodec": "mp3", "preferredquality": "192"}
-            ]
-        else:
-            if quality == "720p":
-                ydl_opts["format"] = "best[height<=720]"
-            elif quality == "480p":
-                ydl_opts["format"] = "best[height<=480]"
-            else:
-                ydl_opts["format"] = "best[height<=1080]"
-        if cookiefile:
-            ydl_opts["cookiefile"] = cookiefile
-        try:
-            with yt_dlp.YoutubeDL(ydl_opts) as ydl:
-                ydl.extract_info(url, download=True)
-            # 첫 파일 찾기
-            for f in os.listdir(self.temp_downloads):
-                if ts in f:
-                    temp_fp = os.path.join(self.temp_downloads, f)
-                    final_fp = os.path.join(self.downloads_folder, f)
-                    try:
-                        shutil.copy2(temp_fp, final_fp)
-                        saved = final_fp
-                    except Exception:
-                        saved = temp_fp
-                    return temp_fp, f"✅ Saved: {saved}"
-            return None, "❌ Downloaded file not found"
-        except Exception as e:
-            return None, f"❌ Download failed: {e}"
-# =================================================================
-# Gradio helper functions
-# =================================================================
-# Module-level downloader instance used by the helper functions below.
-downloader = YouTubeDownloader()
-def configure_api_key(api_key):
-    ok, msg = downloader.configure_gemini(api_key.strip()) if api_key else (False, "❌ API key required")
-    return msg, gr.update(visible=ok)
-def analyze_with_cookies(url, cookies_file, progress=gr.Progress()):
-    info, err = downloader.get_video_info(url, progress, cookies_file)
-    return downloader.format_video_info(info) if info else f"❌ {err}"
-def download_with_cookies(url, qual, audio, cookies_file, progress=gr.Progress()):
-    fp, msg = downloader.download_video(url, qual, audio, progress, cookies_file)
-    return fp, msg
-def get_transcript(url, cookies_file):
-    vid = extract_video_id(url)
-    if not vid:
-        return "❌ Invalid YouTube URL"
-    try:
-        return fetch_transcript(vid)
-    except Exception as e:
-        return f"❌ {e}"
-# =================================================================
-# UI
-# =================================================================
-def create_interface():
-    with gr.Blocks(
-        theme=gr.themes.Soft(), title="🎥 YouTube Video Analyzer & Downloader Pro"
-    ) as iface:
-        gr.HTML("<h1>🎥 YouTube Video Analyzer & Downloader Pro</h1>")
-        # API 설정
-        with gr.Group():
-            gr.HTML("<h3>🔑 Google Gemini API Configuration</h3>")
-            with gr.Row():
-                api_key_in = gr.Textbox(
-                    label="🔑 Google API Key", type="password", placeholder="Paste your Google API key…"
-                )
-                api_btn = gr.Button("🔧 Configure API", variant="secondary")
-            api_status = gr.Textbox(
-                label="API Status",
-                value="❌ Gemini API not configured – Using fallback analysis",
-                interactive=False,
-                lines=1,
-            )
-        # 공통 입력
-        with gr.Row():
-            url_in = gr.Textbox(label="🔗 YouTube URL", placeholder="Paste YouTube video URL…")
-            cookies_in = gr.File(
-                label="🍪 Upload cookies.txt (optional)", file_types=[".txt"], type="filepath"
-            )
-        with gr.Tabs():
-            # 분석 탭
-            with gr.TabItem("📊 Video Analysis"):
-                analyze_btn = gr.Button("🔍 Analyze Video", variant="primary")
-                analysis_out = gr.Textbox(label="📊 Analysis Report", lines=30, show_copy_button=True)
-                analyze_btn.click(
-                    analyze_with_cookies, inputs=[url_in, cookies_in], outputs=analysis_out, show_progress=True
-                )
-            # 다운로드 탭
-            with gr.TabItem("⬇️ Video Download"):
-                with gr.Row():
-                    quality_dd = gr.Dropdown(
-                        choices=["best", "720p", "480p"], value="best", label="📺 Quality"
-                    )
-                    audio_cb = gr.Checkbox(label="🎵 Audio only (MP3)")
-                download_btn = gr.Button("⬇️ Download Video", variant="primary")
-                dl_status = gr.Textbox(label="📥 Download Status", lines=5, show_copy_button=True)
-                dl_file = gr.File(label="📁 Downloaded File", visible=False)
-                def wrapped_dl(u, q, a, c, prog=gr.Progress()):
-                    fp, st = download_with_cookies(u, q, a, c, prog)
-                    return (st, gr.update(value=fp, visible=True)) if fp and os.path.exists(fp) else (
-                        st,
-                        gr.update(visible=False),
-                    )
-                download_btn.click(
-                    wrapped_dl,
-                    inputs=[url_in, quality_dd, audio_cb, cookies_in],
-                    outputs=[dl_status, dl_file],
-                    show_progress=True,
-                )
-            # 자막 탭  NEW
-            with gr.TabItem("🗒️ Transcript"):
-                tr_btn = gr.Button("📜 Get Full Transcript", variant="primary")
-                tr_out = gr.Textbox(
-                    label="🗒️ Transcript (full)", lines=30, show_copy_button=True
-                )
-                tr_btn.click(
-                    get_transcript, inputs=[url_in, cookies_in], outputs=tr_out, show_progress=True
-                )
-        # API 버튼
-        api_btn.click(configure_api_key, inputs=[api_key_in], outputs=[api_status])
-        gr.HTML(
-            """
-<div style="margin-top:20px;padding:15px;background:#f0f8ff;border-left:5px solid #4285f4;border-radius:10px;">
-  <h3>💡 Tip: 쿠키 파일 자동 사용</h3>
-  <p><code>www.youtube.com_cookies.txt</code> 파일을 <strong>app.py</strong>와 같은
-  폴더에 두면 업로드 없이 자동 사용됩니다.</p>
-</div>
-"""
-        )
-    return iface
-# =================================================================
-# Entry point
-# =================================================================
-if __name__ == "__main__":
-    demo = create_interface()
-    import atexit
-    atexit.register(downloader.cleanup)
-    demo.launch(debug=True, show_error=True)
-#!/usr/bin/env python3
-"""
-YouTube Video Analyzer & Downloader Pro
 ───────────────────────────────────────
 •  `www.youtube.com_cookies.txt` 가 app.py 와 같은 폴더에 있으면 자동으로 사용
 •  UI에서 쿠키를 업로드하면 그 파일이 *우선* 적용

 #!/usr/bin/env python3
 """
 YouTube Video Analyzer & Downloader Pro
 ───────────────────────────────────────
 •  `www.youtube.com_cookies.txt` 가 app.py 와 같은 폴더에 있으면 자동으로 사용
 •  UI에서 쿠키를 업로드하면 그 파일이 *우선* 적용