openai.py 1.5 KB

123456789101112131415161718192021222324252627282930313233343536
  1. import os
  2. from typing import Optional
  3. from chromadb.utils.embedding_functions import OpenAIEmbeddingFunction
  4. from langchain_community.embeddings import AzureOpenAIEmbeddings
  5. from embedchain.config import BaseEmbedderConfig
  6. from embedchain.embedder.base import BaseEmbedder
  7. from embedchain.models import VectorDimensions
  8. class OpenAIEmbedder(BaseEmbedder):
  9. def __init__(self, config: Optional[BaseEmbedderConfig] = None):
  10. super().__init__(config=config)
  11. if self.config.model is None:
  12. self.config.model = "text-embedding-ada-002"
  13. api_key = self.config.api_key or os.environ["OPENAI_API_KEY"]
  14. if self.config.deployment_name:
  15. embeddings = AzureOpenAIEmbeddings(deployment=self.config.deployment_name)
  16. embedding_fn = BaseEmbedder._langchain_default_concept(embeddings)
  17. else:
  18. if api_key is None and os.getenv("OPENAI_ORGANIZATION") is None:
  19. raise ValueError(
  20. "OPENAI_API_KEY or OPENAI_ORGANIZATION environment variables not provided"
  21. ) # noqa:E501
  22. embedding_fn = OpenAIEmbeddingFunction(
  23. api_key=api_key,
  24. organization_id=os.getenv("OPENAI_ORGANIZATION"),
  25. model_name=self.config.model,
  26. )
  27. self.set_embedding_fn(embedding_fn=embedding_fn)
  28. vector_dimension = self.config.vector_dimension or VectorDimensions.OPENAI.value
  29. self.set_vector_dimension(vector_dimension=vector_dimension)