openai.py 1.6 KB

1234567891011121314151617181920212223242526272829303132333435363738
  1. import os
  2. from typing import Optional
  3. from chromadb.utils.embedding_functions import OpenAIEmbeddingFunction
  4. from langchain_openai.embeddings import AzureOpenAIEmbeddings
  5. from embedchain.config import BaseEmbedderConfig
  6. from embedchain.embedder.base import BaseEmbedder
  7. from embedchain.models import VectorDimensions
  8. class OpenAIEmbedder(BaseEmbedder):
  9. def __init__(self, config: Optional[BaseEmbedderConfig] = None):
  10. super().__init__(config=config)
  11. if self.config.model is None:
  12. self.config.model = "text-embedding-ada-002"
  13. api_key = self.config.api_key or os.environ["OPENAI_API_KEY"]
  14. api_base = self.config.api_base or os.environ.get("OPENAI_API_BASE")
  15. if self.config.deployment_name:
  16. embeddings = AzureOpenAIEmbeddings(deployment=self.config.deployment_name)
  17. embedding_fn = BaseEmbedder._langchain_default_concept(embeddings)
  18. else:
  19. if api_key is None and os.getenv("OPENAI_ORGANIZATION") is None:
  20. raise ValueError(
  21. "OPENAI_API_KEY or OPENAI_ORGANIZATION environment variables not provided"
  22. ) # noqa:E501
  23. embedding_fn = OpenAIEmbeddingFunction(
  24. api_key=api_key,
  25. api_base=api_base,
  26. organization_id=os.getenv("OPENAI_ORGANIZATION"),
  27. model_name=self.config.model,
  28. )
  29. self.set_embedding_fn(embedding_fn=embedding_fn)
  30. vector_dimension = self.config.vector_dimension or VectorDimensions.OPENAI.value
  31. self.set_vector_dimension(vector_dimension=vector_dimension)