12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667 |
- import builtins
- from importlib import import_module
- from typing import Callable, Optional
- from embedchain.config.base_config import BaseConfig
- from embedchain.helper.json_serializable import register_deserializable
- @register_deserializable
- class ChunkerConfig(BaseConfig):
- """
- Config for the chunker used in `add` method
- """
- def __init__(
- self,
- chunk_size: Optional[int] = None,
- chunk_overlap: Optional[int] = None,
- length_function: Optional[Callable[[str], int]] = None,
- ):
- self.chunk_size = chunk_size if chunk_size else 2000
- self.chunk_overlap = chunk_overlap if chunk_overlap else 0
- if isinstance(length_function, str):
- self.length_function = self.load_func(length_function)
- else:
- self.length_function = length_function if length_function else len
- def load_func(self, dotpath: str):
- if "." not in dotpath:
- return getattr(builtins, dotpath)
- else:
- module_, func = dotpath.rsplit(".", maxsplit=1)
- m = import_module(module_)
- return getattr(m, func)
- @register_deserializable
- class LoaderConfig(BaseConfig):
- """
- Config for the chunker used in `add` method
- """
- def __init__(self):
- pass
- @register_deserializable
- class AddConfig(BaseConfig):
- """
- Config for the `add` method.
- """
- def __init__(
- self,
- chunker: Optional[ChunkerConfig] = None,
- loader: Optional[LoaderConfig] = None,
- ):
- """
- Initializes a configuration class instance for the `add` method.
- :param chunker: Chunker config, defaults to None
- :type chunker: Optional[ChunkerConfig], optional
- :param loader: Loader config, defaults to None
- :type loader: Optional[LoaderConfig], optional
- """
- self.loader = loader
- self.chunker = chunker
|