12345678910111213141516171819202122 |
- from langchain.document_loaders import YoutubeLoader
- from embedchain.utils import clean_string
- class YoutubeVideoLoader:
- def load_data(self, url):
- loader = YoutubeLoader.from_youtube_url(url, add_video_info=True)
- doc = loader.load()
- output = []
- if not len(doc):
- raise ValueError("No data found")
- content = doc[0].page_content
- content = clean_string(content)
- meta_data = doc[0].metadata
- meta_data["url"] = url
- output.append({
- "content": content,
- "meta_data": meta_data,
- })
- return output
|