123456789101112131415161718192021222324 |
- from langchain.document_loaders import YoutubeLoader
- from embedchain.utils import clean_string
- class YoutubeVideoLoader:
- def load_data(self, url):
- """Load data from a Youtube video."""
- loader = YoutubeLoader.from_youtube_url(url, add_video_info=True)
- doc = loader.load()
- output = []
- if not len(doc):
- raise ValueError("No data found")
- content = doc[0].page_content
- content = clean_string(content)
- meta_data = doc[0].metadata
- meta_data["url"] = url
- output.append(
- {
- "content": content,
- "meta_data": meta_data,
- }
- )
- return output
|