# InitConfig.py
  1. import logging
  2. import os
  3. from chromadb.utils import embedding_functions
  4. from embedchain.config.BaseConfig import BaseConfig
  5. class InitConfig(BaseConfig):
  6. """
  7. Config to initialize an embedchain `App` instance.
  8. """
  9. def __init__(self, log_level=None, ef=None, db=None, host=None, port=None):
  10. """
  11. :param log_level: Optional. (String) Debug level
  12. ['DEBUG', 'INFO', 'WARNING', 'ERROR', 'CRITICAL'].
  13. :param ef: Optional. Embedding function to use.
  14. :param db: Optional. (Vector) database to use for embeddings.
  15. :param host: Optional. Hostname for the database server.
  16. :param port: Optional. Port for the database server.
  17. """
  18. self._setup_logging(log_level)
  19. self.ef = ef
  20. self.db = db
  21. self.host = host
  22. self.port = port
  23. return
  24. def _set_embedding_function(self, ef):
  25. self.ef = ef
  26. return
  27. def _set_embedding_function_to_default(self):
  28. """
  29. Sets embedding function to default (`text-embedding-ada-002`).
  30. :raises ValueError: If the template is not valid as template should contain
  31. $context and $query
  32. """
  33. if (
  34. os.getenv("OPENAI_API_KEY") is None
  35. and os.getenv("OPENAI_ORGANIZATION") is None
  36. ):
  37. raise ValueError(
  38. "OPENAI_API_KEY or OPENAI_ORGANIZATION environment variables not provided" # noqa:E501
  39. )
  40. self.ef = embedding_functions.OpenAIEmbeddingFunction(
  41. api_key=os.getenv("OPENAI_API_KEY"),
  42. organization_id=os.getenv("OPENAI_ORGANIZATION"),
  43. model_name="text-embedding-ada-002",
  44. )
  45. return
  46. def _set_db(self, db):
  47. if db:
  48. self.db = db
  49. return
  50. def _set_db_to_default(self):
  51. """
  52. Sets database to default (`ChromaDb`).
  53. """
  54. from embedchain.vectordb.chroma_db import ChromaDB
  55. self.db = ChromaDB(ef=self.ef, host=self.host, port=self.port)
  56. def _setup_logging(self, debug_level):
  57. level = logging.WARNING # Default level
  58. if debug_level is not None:
  59. level = getattr(logging, debug_level.upper(), None)
  60. if not isinstance(level, int):
  61. raise ValueError(f"Invalid log level: {debug_level}")
  62. logging.basicConfig(
  63. format="%(asctime)s [%(name)s] [%(levelname)s] %(message)s", level=level
  64. )
  65. self.logger = logging.getLogger(__name__)
  66. return