simple_prompt_transform.py

import enum
import json
import os
from typing import TYPE_CHECKING, Optional

from core.app.app_config.entities import PromptTemplateEntity
from core.app.entities.app_invoke_entities import ModelConfigWithCredentialsEntity
from core.memory.token_buffer_memory import TokenBufferMemory
from core.model_runtime.entities.message_entities import (
    PromptMessage,
    SystemPromptMessage,
    TextPromptMessageContent,
    UserPromptMessage,
)
from core.prompt.entities.advanced_prompt_entities import MemoryConfig
from core.prompt.prompt_transform import PromptTransform
from core.prompt.utils.prompt_template_parser import PromptTemplateParser
from models.model import AppMode

if TYPE_CHECKING:
    from core.file.file_obj import FileVar


class ModelMode(enum.Enum):
    COMPLETION = "completion"
    CHAT = "chat"

    @classmethod
    def value_of(cls, value: str) -> "ModelMode":
        """
        Get value of given mode.

        :param value: mode value
        :return: mode
        """
        for mode in cls:
            if mode.value == value:
                return mode

        raise ValueError(f"invalid mode value {value}")
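

# Module-level cache of loaded prompt rule files, keyed by file name, so each
# JSON template is read from disk at most once per process.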
prompt_file_contents = {}


class SimplePromptTransform(PromptTransform):
    """
    Simple Prompt Transform for Chatbot App Basic Mode.
    """

    def get_prompt(
        self,
        app_mode: AppMode,
        prompt_template_entity: PromptTemplateEntity,
        inputs: dict,
        query: str,
        files: list["FileVar"],
        context: Optional[str],
        memory: Optional[TokenBufferMemory],
        model_config: ModelConfigWithCredentialsEntity,
    ) -> tuple[list[PromptMessage], Optional[list[str]]]:
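        """
        Build the final prompt messages for a basic-mode app, dispatching to
        the chat or completion builder based on the model mode.

        :return: prompt messages and optional stop words
        """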
        inputs = {key: str(value) for key, value in inputs.items()}

        model_mode = ModelMode.value_of(model_config.mode)
        if model_mode == ModelMode.CHAT:
            prompt_messages, stops = self._get_chat_model_prompt_messages(
                app_mode=app_mode,
                pre_prompt=prompt_template_entity.simple_prompt_template,
                inputs=inputs,
                query=query,
                files=files,
                context=context,
                memory=memory,
                model_config=model_config,
            )
        else:
            prompt_messages, stops = self._get_completion_model_prompt_messages(
                app_mode=app_mode,
                pre_prompt=prompt_template_entity.simple_prompt_template,
                inputs=inputs,
                query=query,
                files=files,
                context=context,
                memory=memory,
                model_config=model_config,
            )

        return prompt_messages, stops

    def get_prompt_str_and_rules(
        self,
        app_mode: AppMode,
        model_config: ModelConfigWithCredentialsEntity,
        pre_prompt: str,
        inputs: dict,
        query: Optional[str] = None,
        context: Optional[str] = None,
        histories: Optional[str] = None,
    ) -> tuple[str, dict]:
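        """
        Render the prompt template to a plain string, filling in custom
        variables from `inputs` and the special #context#, #query# and
        #histories# placeholders.

        :return: rendered prompt string and the prompt rules it was built from
        """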
        # get prompt template
        prompt_template_config = self.get_prompt_template(
            app_mode=app_mode,
            provider=model_config.provider,
            model=model_config.model,
            pre_prompt=pre_prompt,
            has_context=context is not None,
            query_in_prompt=query is not None,
            with_memory_prompt=histories is not None,
        )

        variables = {k: inputs[k] for k in prompt_template_config["custom_variable_keys"] if k in inputs}

        for v in prompt_template_config["special_variable_keys"]:
            # support #context#, #query# and #histories#
            if v == "#context#":
                variables["#context#"] = context or ""
            elif v == "#query#":
                variables["#query#"] = query or ""
            elif v == "#histories#":
                variables["#histories#"] = histories or ""

        prompt_template = prompt_template_config["prompt_template"]
        prompt = prompt_template.format(variables)

        return prompt, prompt_template_config["prompt_rules"]

    def get_prompt_template(
        self,
        app_mode: AppMode,
        provider: str,
        model: str,
        pre_prompt: str,
        has_context: bool,
        query_in_prompt: bool,
        with_memory_prompt: bool = False,
    ) -> dict:
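        """
        Assemble the prompt template for the given app mode and model by
        concatenating the rule-defined sections (context, pre-prompt,
        histories, query) in their configured order.
        """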
        prompt_rules = self._get_prompt_rule(app_mode=app_mode, provider=provider, model=model)

        custom_variable_keys = []
        special_variable_keys = []

        prompt = ""
        for order in prompt_rules["system_prompt_orders"]:
            if order == "context_prompt" and has_context:
                prompt += prompt_rules["context_prompt"]
                special_variable_keys.append("#context#")
            elif order == "pre_prompt" and pre_prompt:
                prompt += pre_prompt + "\n"
                pre_prompt_template = PromptTemplateParser(template=pre_prompt)
                custom_variable_keys = pre_prompt_template.variable_keys
            elif order == "histories_prompt" and with_memory_prompt:
                prompt += prompt_rules["histories_prompt"]
                special_variable_keys.append("#histories#")

        if query_in_prompt:
            prompt += prompt_rules.get("query_prompt", "{{#query#}}")
            special_variable_keys.append("#query#")

        return {
            "prompt_template": PromptTemplateParser(template=prompt),
            "custom_variable_keys": custom_variable_keys,
            "special_variable_keys": special_variable_keys,
            "prompt_rules": prompt_rules,
        }

    def _get_chat_model_prompt_messages(
        self,
        app_mode: AppMode,
        pre_prompt: str,
        inputs: dict,
        query: str,
        context: Optional[str],
        files: list["FileVar"],
        memory: Optional[TokenBufferMemory],
        model_config: ModelConfigWithCredentialsEntity,
    ) -> tuple[list[PromptMessage], Optional[list[str]]]:
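        """
        Build messages for chat-style models: an optional system prompt,
        any chat histories from memory, then the final user message.
        """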
        prompt_messages = []

        # get prompt
        prompt, _ = self.get_prompt_str_and_rules(
            app_mode=app_mode,
            model_config=model_config,
            pre_prompt=pre_prompt,
            inputs=inputs,
            query=None,
            context=context,
        )

        if prompt and query:
            prompt_messages.append(SystemPromptMessage(content=prompt))

        if memory:
            prompt_messages = self._append_chat_histories(
                memory=memory,
                memory_config=MemoryConfig(
                    window=MemoryConfig.WindowConfig(
                        enabled=False,
                    )
                ),
                prompt_messages=prompt_messages,
                model_config=model_config,
            )

        if query:
            prompt_messages.append(self.get_last_user_message(query, files))
        else:
            prompt_messages.append(self.get_last_user_message(prompt, files))

        return prompt_messages, None

    def _get_completion_model_prompt_messages(
        self,
        app_mode: AppMode,
        pre_prompt: str,
        inputs: dict,
        query: str,
        context: Optional[str],
        files: list["FileVar"],
        memory: Optional[TokenBufferMemory],
        model_config: ModelConfigWithCredentialsEntity,
    ) -> tuple[list[PromptMessage], Optional[list[str]]]:
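        """
        Build a single user message for completion-style models. When memory
        is present, the prompt is rendered twice: once to measure remaining
        tokens, then again with the fetched histories included.
        """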
        # get prompt
        prompt, prompt_rules = self.get_prompt_str_and_rules(
            app_mode=app_mode,
            model_config=model_config,
            pre_prompt=pre_prompt,
            inputs=inputs,
            query=query,
            context=context,
        )

        if memory:
            tmp_human_message = UserPromptMessage(content=prompt)

            rest_tokens = self._calculate_rest_token([tmp_human_message], model_config)
            histories = self._get_history_messages_from_memory(
                memory=memory,
                memory_config=MemoryConfig(
                    window=MemoryConfig.WindowConfig(
                        enabled=False,
                    )
                ),
                max_token_limit=rest_tokens,
                human_prefix=prompt_rules.get("human_prefix", "Human"),
                ai_prefix=prompt_rules.get("assistant_prefix", "Assistant"),
            )

            # get prompt with histories included
            prompt, prompt_rules = self.get_prompt_str_and_rules(
                app_mode=app_mode,
                model_config=model_config,
                pre_prompt=pre_prompt,
                inputs=inputs,
                query=query,
                context=context,
                histories=histories,
            )

        stops = prompt_rules.get("stops")
        if stops is not None and len(stops) == 0:
            stops = None

        return [self.get_last_user_message(prompt, files)], stops

    def get_last_user_message(self, prompt: str, files: list["FileVar"]) -> UserPromptMessage:
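        """
        Wrap the prompt (and any file contents) into a single user message.
        """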
        if files:
            prompt_message_contents = [TextPromptMessageContent(data=prompt)]
            for file in files:
                prompt_message_contents.append(file.prompt_message_content)

            prompt_message = UserPromptMessage(content=prompt_message_contents)
        else:
            prompt_message = UserPromptMessage(content=prompt)

        return prompt_message

    def _get_prompt_rule(self, app_mode: AppMode, provider: str, model: str) -> dict:
        """
        Get simple prompt rule.

        :param app_mode: app mode
        :param provider: model provider
        :param model: model name
        :return: prompt rules loaded from the matching JSON template
        """
        prompt_file_name = self._prompt_file_name(app_mode=app_mode, provider=provider, model=model)

        # Check if the prompt file is already loaded
        if prompt_file_name in prompt_file_contents:
            return prompt_file_contents[prompt_file_name]

        # Get the absolute path of the subdirectory
        prompt_path = os.path.join(os.path.dirname(os.path.realpath(__file__)), "prompt_templates")
        json_file_path = os.path.join(prompt_path, f"{prompt_file_name}.json")

        # Open the JSON file and read its content
        with open(json_file_path, encoding="utf-8") as json_file:
            content = json.load(json_file)

            # Store the content of the prompt file
            prompt_file_contents[prompt_file_name] = content

        return content

    def _prompt_file_name(self, app_mode: AppMode, provider: str, model: str) -> str:
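        """
        Pick the prompt rule file: Baichuan models get dedicated templates,
        everything else falls back to the common ones.
        """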
        # baichuan
        is_baichuan = False
        if provider == "baichuan":
            is_baichuan = True
        else:
            baichuan_supported_providers = ["huggingface_hub", "openllm", "xinference"]
            if provider in baichuan_supported_providers and "baichuan" in model.lower():
                is_baichuan = True

        if is_baichuan:
            if app_mode == AppMode.COMPLETION:
                return "baichuan_completion"
            else:
                return "baichuan_chat"

        # common
        if app_mode == AppMode.COMPLETION:
            return "common_completion"
        else:
            return "common_chat"
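

# A minimal usage sketch (hypothetical values; real prompt_template_entity and
# model_config objects come from the surrounding app layer):
#
#     transform = SimplePromptTransform()
#     prompt_messages, stops = transform.get_prompt(
#         app_mode=AppMode.CHAT,
#         prompt_template_entity=prompt_template_entity,
#         inputs={"name": "Ada"},
#         query="Hello!",
#         files=[],
#         context=None,
#         memory=None,
#         model_config=model_config,
#     )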