123456789101112131415161718192021222324252627282930313233343536 |
- import os
- from typing import Optional
- from chromadb.utils.embedding_functions import OpenAIEmbeddingFunction
- from langchain_community.embeddings import AzureOpenAIEmbeddings
- from embedchain.config import BaseEmbedderConfig
- from embedchain.embedder.base import BaseEmbedder
- from embedchain.models import VectorDimensions
- class OpenAIEmbedder(BaseEmbedder):
- def __init__(self, config: Optional[BaseEmbedderConfig] = None):
- super().__init__(config=config)
- if self.config.model is None:
- self.config.model = "text-embedding-ada-002"
- api_key = self.config.api_key or os.environ["OPENAI_API_KEY"]
- if self.config.deployment_name:
- embeddings = AzureOpenAIEmbeddings(deployment=self.config.deployment_name)
- embedding_fn = BaseEmbedder._langchain_default_concept(embeddings)
- else:
- if api_key is None and os.getenv("OPENAI_ORGANIZATION") is None:
- raise ValueError(
- "OPENAI_API_KEY or OPENAI_ORGANIZATION environment variables not provided"
- ) # noqa:E501
- embedding_fn = OpenAIEmbeddingFunction(
- api_key=api_key,
- organization_id=os.getenv("OPENAI_ORGANIZATION"),
- model_name=self.config.model,
- )
- self.set_embedding_fn(embedding_fn=embedding_fn)
- vector_dimension = self.config.vector_dimension or VectorDimensions.OPENAI.value
- self.set_vector_dimension(vector_dimension=vector_dimension)
|