# model_manager.py (9.6 KB)
  1. from collections.abc import Generator
  2. from typing import IO, Optional, Union, cast
  3. from core.entities.provider_configuration import ProviderModelBundle
  4. from core.errors.error import ProviderTokenNotInitError
  5. from core.model_runtime.callbacks.base_callback import Callback
  6. from core.model_runtime.entities.llm_entities import LLMResult
  7. from core.model_runtime.entities.message_entities import PromptMessage, PromptMessageTool
  8. from core.model_runtime.entities.model_entities import ModelType
  9. from core.model_runtime.entities.rerank_entities import RerankResult
  10. from core.model_runtime.entities.text_embedding_entities import TextEmbeddingResult
  11. from core.model_runtime.model_providers.__base.large_language_model import LargeLanguageModel
  12. from core.model_runtime.model_providers.__base.moderation_model import ModerationModel
  13. from core.model_runtime.model_providers.__base.rerank_model import RerankModel
  14. from core.model_runtime.model_providers.__base.speech2text_model import Speech2TextModel
  15. from core.model_runtime.model_providers.__base.text_embedding_model import TextEmbeddingModel
  16. from core.model_runtime.model_providers.__base.tts_model import TTSModel
  17. from core.provider_manager import ProviderManager
  18. class ModelInstance:
  19. """
  20. Model instance class
  21. """
  22. def __init__(self, provider_model_bundle: ProviderModelBundle, model: str) -> None:
  23. self.provider_model_bundle = provider_model_bundle
  24. self.model = model
  25. self.provider = provider_model_bundle.configuration.provider.provider
  26. self.credentials = self._fetch_credentials_from_bundle(provider_model_bundle, model)
  27. self.model_type_instance = self.provider_model_bundle.model_type_instance
  28. def _fetch_credentials_from_bundle(self, provider_model_bundle: ProviderModelBundle, model: str) -> dict:
  29. """
  30. Fetch credentials from provider model bundle
  31. :param provider_model_bundle: provider model bundle
  32. :param model: model name
  33. :return:
  34. """
  35. credentials = provider_model_bundle.configuration.get_current_credentials(
  36. model_type=provider_model_bundle.model_type_instance.model_type,
  37. model=model
  38. )
  39. if credentials is None:
  40. raise ProviderTokenNotInitError(f"Model {model} credentials is not initialized.")
  41. return credentials
  42. def invoke_llm(self, prompt_messages: list[PromptMessage], model_parameters: Optional[dict] = None,
  43. tools: Optional[list[PromptMessageTool]] = None, stop: Optional[list[str]] = None,
  44. stream: bool = True, user: Optional[str] = None, callbacks: list[Callback] = None) \
  45. -> Union[LLMResult, Generator]:
  46. """
  47. Invoke large language model
  48. :param prompt_messages: prompt messages
  49. :param model_parameters: model parameters
  50. :param tools: tools for tool calling
  51. :param stop: stop words
  52. :param stream: is stream response
  53. :param user: unique user id
  54. :param callbacks: callbacks
  55. :return: full response or stream response chunk generator result
  56. """
  57. if not isinstance(self.model_type_instance, LargeLanguageModel):
  58. raise Exception("Model type instance is not LargeLanguageModel")
  59. self.model_type_instance = cast(LargeLanguageModel, self.model_type_instance)
  60. return self.model_type_instance.invoke(
  61. model=self.model,
  62. credentials=self.credentials,
  63. prompt_messages=prompt_messages,
  64. model_parameters=model_parameters,
  65. tools=tools,
  66. stop=stop,
  67. stream=stream,
  68. user=user,
  69. callbacks=callbacks
  70. )
  71. def invoke_text_embedding(self, texts: list[str], user: Optional[str] = None) \
  72. -> TextEmbeddingResult:
  73. """
  74. Invoke large language model
  75. :param texts: texts to embed
  76. :param user: unique user id
  77. :return: embeddings result
  78. """
  79. if not isinstance(self.model_type_instance, TextEmbeddingModel):
  80. raise Exception("Model type instance is not TextEmbeddingModel")
  81. self.model_type_instance = cast(TextEmbeddingModel, self.model_type_instance)
  82. return self.model_type_instance.invoke(
  83. model=self.model,
  84. credentials=self.credentials,
  85. texts=texts,
  86. user=user
  87. )
  88. def invoke_rerank(self, query: str, docs: list[str], score_threshold: Optional[float] = None,
  89. top_n: Optional[int] = None,
  90. user: Optional[str] = None) \
  91. -> RerankResult:
  92. """
  93. Invoke rerank model
  94. :param query: search query
  95. :param docs: docs for reranking
  96. :param score_threshold: score threshold
  97. :param top_n: top n
  98. :param user: unique user id
  99. :return: rerank result
  100. """
  101. if not isinstance(self.model_type_instance, RerankModel):
  102. raise Exception("Model type instance is not RerankModel")
  103. self.model_type_instance = cast(RerankModel, self.model_type_instance)
  104. return self.model_type_instance.invoke(
  105. model=self.model,
  106. credentials=self.credentials,
  107. query=query,
  108. docs=docs,
  109. score_threshold=score_threshold,
  110. top_n=top_n,
  111. user=user
  112. )
  113. def invoke_moderation(self, text: str, user: Optional[str] = None) \
  114. -> bool:
  115. """
  116. Invoke moderation model
  117. :param text: text to moderate
  118. :param user: unique user id
  119. :return: false if text is safe, true otherwise
  120. """
  121. if not isinstance(self.model_type_instance, ModerationModel):
  122. raise Exception("Model type instance is not ModerationModel")
  123. self.model_type_instance = cast(ModerationModel, self.model_type_instance)
  124. return self.model_type_instance.invoke(
  125. model=self.model,
  126. credentials=self.credentials,
  127. text=text,
  128. user=user
  129. )
  130. def invoke_speech2text(self, file: IO[bytes], user: Optional[str] = None) \
  131. -> str:
  132. """
  133. Invoke large language model
  134. :param file: audio file
  135. :param user: unique user id
  136. :return: text for given audio file
  137. """
  138. if not isinstance(self.model_type_instance, Speech2TextModel):
  139. raise Exception("Model type instance is not Speech2TextModel")
  140. self.model_type_instance = cast(Speech2TextModel, self.model_type_instance)
  141. return self.model_type_instance.invoke(
  142. model=self.model,
  143. credentials=self.credentials,
  144. file=file,
  145. user=user
  146. )
  147. def invoke_tts(self, content_text: str, tenant_id: str, voice: str, streaming: bool, user: Optional[str] = None) \
  148. -> str:
  149. """
  150. Invoke large language tts model
  151. :param content_text: text content to be translated
  152. :param tenant_id: user tenant id
  153. :param user: unique user id
  154. :param voice: model timbre
  155. :param streaming: output is streaming
  156. :return: text for given audio file
  157. """
  158. if not isinstance(self.model_type_instance, TTSModel):
  159. raise Exception("Model type instance is not TTSModel")
  160. self.model_type_instance = cast(TTSModel, self.model_type_instance)
  161. return self.model_type_instance.invoke(
  162. model=self.model,
  163. credentials=self.credentials,
  164. content_text=content_text,
  165. user=user,
  166. tenant_id=tenant_id,
  167. voice=voice,
  168. streaming=streaming
  169. )
  170. def get_tts_voices(self, language: str) -> list:
  171. """
  172. Invoke large language tts model voices
  173. :param language: tts language
  174. :return: tts model voices
  175. """
  176. if not isinstance(self.model_type_instance, TTSModel):
  177. raise Exception("Model type instance is not TTSModel")
  178. self.model_type_instance = cast(TTSModel, self.model_type_instance)
  179. return self.model_type_instance.get_tts_model_voices(
  180. model=self.model,
  181. credentials=self.credentials,
  182. language=language
  183. )
  184. class ModelManager:
  185. def __init__(self) -> None:
  186. self._provider_manager = ProviderManager()
  187. def get_model_instance(self, tenant_id: str, provider: str, model_type: ModelType, model: str) -> ModelInstance:
  188. """
  189. Get model instance
  190. :param tenant_id: tenant id
  191. :param provider: provider name
  192. :param model_type: model type
  193. :param model: model name
  194. :return:
  195. """
  196. if not provider:
  197. return self.get_default_model_instance(tenant_id, model_type)
  198. provider_model_bundle = self._provider_manager.get_provider_model_bundle(
  199. tenant_id=tenant_id,
  200. provider=provider,
  201. model_type=model_type
  202. )
  203. return ModelInstance(provider_model_bundle, model)
  204. def get_default_model_instance(self, tenant_id: str, model_type: ModelType) -> ModelInstance:
  205. """
  206. Get default model instance
  207. :param tenant_id: tenant id
  208. :param model_type: model type
  209. :return:
  210. """
  211. default_model_entity = self._provider_manager.get_default_model(
  212. tenant_id=tenant_id,
  213. model_type=model_type
  214. )
  215. if not default_model_entity:
  216. raise ProviderTokenNotInitError(f"Default model not found for {model_type}")
  217. return self.get_model_instance(
  218. tenant_id=tenant_id,
  219. provider=default_model_entity.provider.provider,
  220. model_type=model_type,
  221. model=default_model_entity.model
  222. )