from langchain_core.tools import tool from youtube_transcript_api import YouTubeTranscriptApi, NoTranscriptFound, TranscriptsDisabled @tool("youtube_transcript_extractor", parse_docstring=True) def extract_youtube_transcript(youtube_url: str) -> str: """Extracts the transcript from a given YouTube video URL. Args: youtube_url (str): The URL of the YouTube video. Returns: str: The transcript as a single string, or an error message if the transcript cannot be found or an error occurs. """ try: video_id = youtube_url.split("v=")[1].split("&")[0] transcript_list = YouTubeTranscriptApi.get_transcript(video_id) transcript = " ".join([item['text'] for item in transcript_list]) return transcript except NoTranscriptFound: return "Error: No transcript found for this video. It might be disabled or not available in English." except TranscriptsDisabled: return "Error: Transcripts are disabled for this video." except Exception as e: return f"Error extracting transcript: {str(e)}"