youtube_video.py 697 B

123456789101112131415161718192021222324
  1. from langchain.document_loaders import YoutubeLoader
  2. from embedchain.utils import clean_string
  3. class YoutubeVideoLoader:
  4. def load_data(self, url):
  5. """Load data from a Youtube video."""
  6. loader = YoutubeLoader.from_youtube_url(url, add_video_info=True)
  7. doc = loader.load()
  8. output = []
  9. if not len(doc):
  10. raise ValueError("No data found")
  11. content = doc[0].page_content
  12. content = clean_string(content)
  13. meta_data = doc[0].metadata
  14. meta_data["url"] = url
  15. output.append(
  16. {
  17. "content": content,
  18. "meta_data": meta_data,
  19. }
  20. )
  21. return output