InitConfig.py 2.8 KB

1234567891011121314151617181920212223242526272829303132333435363738394041424344454647484950515253545556575859606162636465666768697071727374757677787980818283848586878889909192939495
  1. import logging
  2. import os
  3. from chromadb.utils import embedding_functions
  4. from embedchain.config.BaseConfig import BaseConfig
  5. class InitConfig(BaseConfig):
  6. """
  7. Config to initialize an embedchain `App` instance.
  8. """
  9. def __init__(self, log_level=None, ef=None, db=None, host=None, port=None):
  10. """
  11. :param log_level: Optional. (String) Debug level
  12. ['DEBUG', 'INFO', 'WARNING', 'ERROR', 'CRITICAL'].
  13. :param ef: Optional. Embedding function to use.
  14. :param db: Optional. (Vector) database to use for embeddings.
  15. """
  16. self._setup_logging(log_level)
  17. # Embedding Function
  18. if ef is None:
  19. from chromadb.utils import embedding_functions
  20. self.ef = embedding_functions.OpenAIEmbeddingFunction(
  21. api_key=os.getenv("OPENAI_API_KEY"),
  22. organization_id=os.getenv("OPENAI_ORGANIZATION"),
  23. model_name="text-embedding-ada-002",
  24. )
  25. else:
  26. self.ef = ef
  27. if db is None:
  28. from embedchain.vectordb.chroma_db import ChromaDB
  29. self.db = ChromaDB(ef=self.ef, host=host, port=port)
  30. else:
  31. self.db = db
  32. self.ef = ef
  33. self.db = db
  34. return
  35. def _set_embedding_function(self, ef):
  36. self.ef = ef
  37. return
  38. def _set_embedding_function_to_default(self):
  39. """
  40. Sets embedding function to default (`text-embedding-ada-002`).
  41. :raises ValueError: If the template is not valid as template should contain
  42. $context and $query
  43. """
  44. if (
  45. os.getenv("OPENAI_API_KEY") is None
  46. or os.getenv("OPENAI_ORGANIZATION") is None
  47. ):
  48. raise ValueError(
  49. "OPENAI_API_KEY or OPENAI_ORGANIZATION environment variables not provided" # noqa:E501
  50. )
  51. self.ef = embedding_functions.OpenAIEmbeddingFunction(
  52. api_key=os.getenv("OPENAI_API_KEY"),
  53. organization_id=os.getenv("OPENAI_ORGANIZATION"),
  54. model_name="text-embedding-ada-002",
  55. )
  56. return
  57. def _set_db(self, db):
  58. if db:
  59. self.db = db
  60. return
  61. def _set_db_to_default(self):
  62. """
  63. Sets database to default (`ChromaDb`).
  64. """
  65. from embedchain.vectordb.chroma_db import ChromaDB
  66. self.db = ChromaDB(ef=self.ef)
  67. def _setup_logging(self, debug_level):
  68. level = logging.WARNING # Default level
  69. if debug_level is not None:
  70. level = getattr(logging, debug_level.upper(), None)
  71. if not isinstance(level, int):
  72. raise ValueError(f"Invalid log level: {debug_level}")
  73. logging.basicConfig(
  74. format="%(asctime)s [%(name)s] [%(levelname)s] %(message)s", level=level
  75. )
  76. self.logger = logging.getLogger(__name__)
  77. return