Spaces:
No application file
No application file
File size: 1,101 Bytes
d5ccf60 c4b829b d5ccf60 c4b829b d5ccf60 c4b829b |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 |
from langchain_core.tools import tool
from youtube_transcript_api import YouTubeTranscriptApi, NoTranscriptFound, TranscriptsDisabled
@tool("youtube_transcript_extractor", parse_docstring=True)
def extract_youtube_transcript(youtube_url: str) -> str:
"""Extracts the transcript from a given YouTube video URL.
Args:
youtube_url (str): The URL of the YouTube video.
Returns:
str: The transcript as a single string, or an error message if the transcript
cannot be found or an error occurs.
"""
try:
video_id = youtube_url.split("v=")[1].split("&")[0]
transcript_list = YouTubeTranscriptApi.get_transcript(video_id)
transcript = " ".join([item['text'] for item in transcript_list])
return transcript
except NoTranscriptFound:
return "Error: No transcript found for this video. It might be disabled or not available in English."
except TranscriptsDisabled:
return "Error: Transcripts are disabled for this video."
except Exception as e:
return f"Error extracting transcript: {str(e)}"
|