groq.py 3.0 KB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667
  1. import os
  2. from typing import Any, Optional
  3. from langchain.callbacks.streaming_stdout import StreamingStdOutCallbackHandler
  4. from langchain.schema import HumanMessage, SystemMessage
  5. try:
  6. from langchain_groq import ChatGroq
  7. except ImportError:
  8. raise ImportError("Groq requires extra dependencies. Install with `pip install langchain-groq`") from None
  9. from embedchain.config import BaseLlmConfig
  10. from embedchain.helpers.json_serializable import register_deserializable
  11. from embedchain.llm.base import BaseLlm
  12. @register_deserializable
  13. class GroqLlm(BaseLlm):
  14. def __init__(self, config: Optional[BaseLlmConfig] = None):
  15. super().__init__(config=config)
  16. if not self.config.api_key and "GROQ_API_KEY" not in os.environ:
  17. raise ValueError("Please set the GROQ_API_KEY environment variable or pass it in the config.")
  18. def get_llm_model_answer(self, prompt) -> tuple[str, Optional[dict[str, Any]]]:
  19. if self.config.token_usage:
  20. response, token_info = self._get_answer(prompt, self.config)
  21. model_name = "groq/" + self.config.model
  22. if model_name not in self.config.model_pricing_map:
  23. raise ValueError(
  24. f"Model {model_name} not found in `model_prices_and_context_window.json`. \
  25. You can disable token usage by setting `token_usage` to False."
  26. )
  27. total_cost = (
  28. self.config.model_pricing_map[model_name]["input_cost_per_token"] * token_info["prompt_tokens"]
  29. ) + self.config.model_pricing_map[model_name]["output_cost_per_token"] * token_info["completion_tokens"]
  30. response_token_info = {
  31. "prompt_tokens": token_info["prompt_tokens"],
  32. "completion_tokens": token_info["completion_tokens"],
  33. "total_tokens": token_info["prompt_tokens"] + token_info["completion_tokens"],
  34. "total_cost": round(total_cost, 10),
  35. "cost_currency": "USD",
  36. }
  37. return response, response_token_info
  38. return self._get_answer(prompt, self.config)
  39. def _get_answer(self, prompt: str, config: BaseLlmConfig) -> str:
  40. messages = []
  41. if config.system_prompt:
  42. messages.append(SystemMessage(content=config.system_prompt))
  43. messages.append(HumanMessage(content=prompt))
  44. api_key = config.api_key or os.environ["GROQ_API_KEY"]
  45. kwargs = {
  46. "model_name": config.model or "mixtral-8x7b-32768",
  47. "temperature": config.temperature,
  48. "groq_api_key": api_key,
  49. }
  50. if config.stream:
  51. callbacks = config.callbacks if config.callbacks else [StreamingStdOutCallbackHandler()]
  52. chat = ChatGroq(**kwargs, streaming=config.stream, callbacks=callbacks, api_key=api_key)
  53. else:
  54. chat = ChatGroq(**kwargs)
  55. chat_response = chat.invoke(prompt)
  56. if self.config.token_usage:
  57. return chat_response.content, chat_response.response_metadata["token_usage"]
  58. return chat_response.content