chroma_db.py 866 B

123456789101112131415161718192021222324252627282930
  1. import chromadb
  2. import os
  3. from chromadb.utils import embedding_functions
  4. from embedchain.vectordb.base_vector_db import BaseVectorDB
  5. openai_ef = embedding_functions.OpenAIEmbeddingFunction(
  6. api_key=os.getenv("OPENAI_API_KEY"),
  7. model_name="text-embedding-ada-002"
  8. )
  9. class ChromaDB(BaseVectorDB):
  10. def __init__(self, db_dir=None):
  11. if db_dir is None:
  12. db_dir = "db"
  13. self.client_settings = chromadb.config.Settings(
  14. chroma_db_impl="duckdb+parquet",
  15. persist_directory=db_dir,
  16. anonymized_telemetry=False
  17. )
  18. super().__init__()
  19. def _get_or_create_db(self):
  20. return chromadb.Client(self.client_settings)
  21. def _get_or_create_collection(self):
  22. return self.client.get_or_create_collection(
  23. 'embedchain_store', embedding_function=openai_ef,
  24. )