File size: 1,101 Bytes
d5ccf60
c4b829b
 
d5ccf60
c4b829b
d5ccf60
 
 
 
 
 
 
 
c4b829b
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
from langchain_core.tools import tool
from youtube_transcript_api import YouTubeTranscriptApi, NoTranscriptFound, TranscriptsDisabled

@tool("youtube_transcript_extractor", parse_docstring=True)
def extract_youtube_transcript(youtube_url: str) -> str:
    """Extracts the transcript from a given YouTube video URL.

    Args:
        youtube_url (str): The URL of the YouTube video.

    Returns:
        str: The transcript as a single string, or an error message if the transcript
             cannot be found or an error occurs.
    """
    try:
        video_id = youtube_url.split("v=")[1].split("&")[0]
        transcript_list = YouTubeTranscriptApi.get_transcript(video_id)
        transcript = " ".join([item['text'] for item in transcript_list])
        return transcript
    except NoTranscriptFound:
        return "Error: No transcript found for this video. It might be disabled or not available in English."
    except TranscriptsDisabled:
        return "Error: Transcripts are disabled for this video."
    except Exception as e:
        return f"Error extracting transcript: {str(e)}"