prompt_transform.py 24 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582
  1. import enum
  2. import json
  3. import os
  4. import re
  5. from typing import List, Optional, Tuple, cast
  6. from core.entities.application_entities import (AdvancedCompletionPromptTemplateEntity, ModelConfigEntity,
  7. PromptTemplateEntity)
  8. from core.file.file_obj import FileObj
  9. from core.memory.token_buffer_memory import TokenBufferMemory
  10. from core.model_runtime.entities.message_entities import (AssistantPromptMessage, PromptMessage, PromptMessageRole,
  11. SystemPromptMessage, TextPromptMessageContent,
  12. UserPromptMessage)
  13. from core.model_runtime.entities.model_entities import ModelPropertyKey
  14. from core.model_runtime.model_providers.__base.large_language_model import LargeLanguageModel
  15. from core.prompt.prompt_builder import PromptBuilder
  16. from core.prompt.prompt_template import PromptTemplateParser
  class AppMode(enum.Enum):
      """
      Application modes recognised by the prompt transform.
      """
      COMPLETION = 'completion'
      CHAT = 'chat'

      @classmethod
      def value_of(cls, value: str) -> 'AppMode':
          """
          Return the member whose value equals the given string.

          :param value: mode value
          :return: mode
          :raises ValueError: if no member carries this value
          """
          found = next((member for member in cls if member.value == value), None)
          if found is None:
              raise ValueError(f'invalid mode value {value}')
          return found
  class ModelMode(enum.Enum):
      """
      Model modes recognised by the prompt transform.
      """
      COMPLETION = 'completion'
      CHAT = 'chat'

      @classmethod
      def value_of(cls, value: str) -> 'ModelMode':
          """
          Return the member whose value equals the given string.

          :param value: mode value
          :return: mode
          :raises ValueError: if no member carries this value
          """
          found = next((member for member in cls if member.value == value), None)
          if found is None:
              raise ValueError(f'invalid mode value {value}')
          return found
  45. class PromptTransform:
  def get_prompt(self,
                 app_mode: str,
                 prompt_template_entity: PromptTemplateEntity,
                 inputs: dict,
                 query: str,
                 files: List[FileObj],
                 context: Optional[str],
                 memory: Optional[TokenBufferMemory],
                 model_config: ModelConfigEntity) -> \
          Tuple[List[PromptMessage], Optional[List[str]]]:
      """
      Build prompt messages from the simple prompt template.

      The prompt rules file is selected from the app mode, provider and model.
      A chat app running on a chat model gets a message list with no stops;
      every other combination gets a single prompt built by
      ``_get_simple_others_prompt_messages`` together with the ``stops``
      entry of the rules.

      :param app_mode: app mode value, resolved through ``AppMode.value_of``
      :param prompt_template_entity: entity providing ``simple_prompt_template``
      :param inputs: values for the template variables
      :param query: user query
      :param files: files to attach to the user message
      :param context: context text, may be None
      :param memory: conversation memory, may be None
      :param model_config: model configuration
      :return: tuple of (prompt messages, stops); stops is None when the rules
          define none or define an empty collection
      :raises ValueError: if the app mode or the model mode is not recognised
      """
      resolved_app_mode = AppMode.value_of(app_mode)
      resolved_model_mode = ModelMode.value_of(model_config.mode)

      rules_file = self._prompt_file_name(
          app_mode=resolved_app_mode,
          provider=model_config.provider,
          model=model_config.model
      )
      rules = self._read_prompt_rules_from_file(rules_file)

      chat_on_chat = resolved_app_mode == AppMode.CHAT and resolved_model_mode == ModelMode.CHAT

      if chat_on_chat:
          stops = None
          build_messages = self._get_simple_chat_app_chat_model_prompt_messages
      else:
          stops = rules.get('stops')
          # An empty stops collection is reported as "no stops".
          if stops is not None and len(stops) == 0:
              stops = None
          build_messages = self._get_simple_others_prompt_messages

      messages = build_messages(
          prompt_rules=rules,
          pre_prompt=prompt_template_entity.simple_prompt_template,
          inputs=inputs,
          query=query,
          files=files,
          context=context,
          memory=memory,
          model_config=model_config
      )

      return messages, stops
  def get_advanced_prompt(self, app_mode: str,
                          prompt_template_entity: PromptTemplateEntity,
                          inputs: dict,
                          query: str,
                          files: List[FileObj],
                          context: Optional[str],
                          memory: Optional[TokenBufferMemory],
                          model_config: ModelConfigEntity) -> List[PromptMessage]:
      """
      Build prompt messages from the advanced prompt templates.

      Dispatches on the (app mode, model mode) pair to one of the four
      dedicated builders. The completion-app builders receive neither the
      query nor the memory; the completion-model one receives no files either.

      :param app_mode: app mode value, resolved through ``AppMode.value_of``
      :param prompt_template_entity: entity holding the advanced templates
      :param inputs: values for the template variables
      :param query: user query
      :param files: files to attach to a user message
      :param context: context text, may be None
      :param memory: conversation memory, may be None
      :param model_config: model configuration
      :return: prompt messages; an empty list if no builder matched
      :raises ValueError: if the app mode or the model mode is not recognised
      """
      resolved_app_mode = AppMode.value_of(app_mode)
      resolved_model_mode = ModelMode.value_of(model_config.mode)

      if resolved_app_mode == AppMode.CHAT:
          if resolved_model_mode == ModelMode.COMPLETION:
              return self._get_chat_app_completion_model_prompt_messages(
                  prompt_template_entity=prompt_template_entity,
                  inputs=inputs,
                  query=query,
                  files=files,
                  context=context,
                  memory=memory,
                  model_config=model_config
              )
          if resolved_model_mode == ModelMode.CHAT:
              return self._get_chat_app_chat_model_prompt_messages(
                  prompt_template_entity=prompt_template_entity,
                  inputs=inputs,
                  query=query,
                  files=files,
                  context=context,
                  memory=memory,
                  model_config=model_config
              )
      elif resolved_app_mode == AppMode.COMPLETION:
          if resolved_model_mode == ModelMode.CHAT:
              return self._get_completion_app_chat_model_prompt_messages(
                  prompt_template_entity=prompt_template_entity,
                  inputs=inputs,
                  files=files,
                  context=context,
              )
          if resolved_model_mode == ModelMode.COMPLETION:
              return self._get_completion_app_completion_model_prompt_messages(
                  prompt_template_entity=prompt_template_entity,
                  inputs=inputs,
                  context=context,
              )

      return []
  137. def _get_history_messages_from_memory(self, memory: TokenBufferMemory,
  138. max_token_limit: int,
  139. human_prefix: Optional[str] = None,
  140. ai_prefix: Optional[str] = None) -> str:
  141. """Get memory messages."""
  142. kwargs = {
  143. "max_token_limit": max_token_limit
  144. }
  145. if human_prefix:
  146. kwargs['human_prefix'] = human_prefix
  147. if ai_prefix:
  148. kwargs['ai_prefix'] = ai_prefix
  149. return memory.get_history_prompt_text(
  150. **kwargs
  151. )
  152. def _get_history_messages_list_from_memory(self, memory: TokenBufferMemory,
  153. max_token_limit: int) -> List[PromptMessage]:
  154. """Get memory messages."""
  155. return memory.get_history_prompt_messages(
  156. max_token_limit=max_token_limit
  157. )
  def _prompt_file_name(self, app_mode: AppMode, provider: str, model: str) -> str:
      """
      Choose the prompt rules file name for an app mode, provider and model.

      The baichuan rules are used when the provider is ``baichuan``, or when
      the provider is one of ``huggingface_hub``, ``openllm``, ``xinference``
      and the lower-cased model name contains ``baichuan``. Everything else
      uses the common rules.

      :param app_mode: app mode
      :param provider: provider name
      :param model: model name
      :return: prompt rules file name
      """
      uses_baichuan_rules = (
          provider == 'baichuan'
          or (provider in ("huggingface_hub", "openllm", "xinference")
              and 'baichuan' in model.lower())
      )
      if uses_baichuan_rules:
          return self._prompt_file_name_for_baichuan(app_mode)

      return 'common_completion' if app_mode == AppMode.COMPLETION else 'common_chat'
  def _prompt_file_name_for_baichuan(self, app_mode: AppMode) -> str:
      """
      Return the baichuan prompt rules file name for the given app mode.

      :param app_mode: app mode
      :return: ``baichuan_completion`` for the completion mode, otherwise ``baichuan_chat``
      """
      return 'baichuan_completion' if app_mode == AppMode.COMPLETION else 'baichuan_chat'
  def _read_prompt_rules_from_file(self, prompt_name: str) -> dict:
      """
      Load prompt rules from ``generate_prompts/<prompt_name>.json``.

      The ``generate_prompts`` directory is looked up next to the real path
      of this module's file.

      :param prompt_name: rules file name without the ``.json`` suffix
      :return: parsed JSON content of the rules file
      """
      module_dir = os.path.dirname(os.path.realpath(__file__))
      rules_file = os.path.join(module_dir, 'generate_prompts', f'{prompt_name}.json')

      with open(rules_file, 'r', encoding='utf-8') as handle:
          return json.load(handle)
  def _get_simple_chat_app_chat_model_prompt_messages(self, prompt_rules: dict,
                                                      pre_prompt: str,
                                                      inputs: dict,
                                                      query: str,
                                                      context: Optional[str],
                                                      files: List[FileObj],
                                                      memory: Optional[TokenBufferMemory],
                                                      model_config: ModelConfigEntity) -> List[PromptMessage]:
      """
      Build the message list for a chat app running on a chat model.

      The result is: an optional system message (context and pre-prompt
      sections in the order given by ``prompt_rules['system_prompt_orders']``),
      the chat histories from memory, then the user message carrying the
      query and, when given, the files.

      :param prompt_rules: prompt rules loaded from the rules file
      :param pre_prompt: pre-prompt template, may be empty
      :param inputs: values for the pre-prompt variables
      :param query: user query
      :param context: context text, may be None
      :param files: files to attach to the user message
      :param memory: conversation memory, may be None
      :param model_config: model configuration
      :return: prompt messages
      """
      # The context section needs both a context and a template for it in the rules.
      rendered_context = ''
      if context and 'context_prompt' in prompt_rules:
          context_parser = PromptTemplateParser(template=prompt_rules['context_prompt'])
          rendered_context = context_parser.format({'context': context})

      # Only inputs matching a variable of the pre-prompt template are passed on.
      rendered_pre_prompt = ''
      if pre_prompt:
          pre_prompt_parser = PromptTemplateParser(template=pre_prompt)
          rendered_pre_prompt = pre_prompt_parser.format({
              key: inputs[key] for key in pre_prompt_parser.variable_keys if key in inputs
          })

      sections = []
      for section_name in prompt_rules['system_prompt_orders']:
          if section_name == 'context_prompt':
              sections.append(rendered_context)
          elif section_name == 'pre_prompt':
              sections.append(rendered_pre_prompt)

      # Strip every `<|...|>` marker from the assembled system text.
      system_text = re.sub(r'<\|.*?\|>', '', ''.join(sections))

      messages = []
      if system_text:
          messages.append(SystemPromptMessage(content=system_text))

      self._append_chat_histories(
          memory=memory,
          prompt_messages=messages,
          model_config=model_config
      )

      if files:
          user_content = [TextPromptMessageContent(data=query)]
          user_content.extend(file.prompt_message_content for file in files)
      else:
          user_content = query
      messages.append(UserPromptMessage(content=user_content))

      return messages
  def _get_simple_others_prompt_messages(self, prompt_rules: dict,
                                         pre_prompt: str,
                                         inputs: dict,
                                         query: str,
                                         context: Optional[str],
                                         memory: Optional[TokenBufferMemory],
                                         files: List[FileObj],
                                         model_config: ModelConfigEntity) -> List[PromptMessage]:
      """
      Build a single user message holding the whole prompt.

      The prompt is assembled from the context, pre-prompt and (when memory
      is available and the rules define ``histories_prompt``) histories
      sections in the order given by ``prompt_rules['system_prompt_orders']``,
      followed by the query prompt. Every ``<|...|>`` marker is stripped from
      the final text.

      :param prompt_rules: prompt rules loaded from the rules file
      :param pre_prompt: pre-prompt template, may be empty
      :param inputs: values for the pre-prompt variables
      :param query: user query
      :param context: context text, may be None
      :param memory: conversation memory, may be None
      :param files: files to attach to the user message
      :param model_config: model configuration
      :return: list containing exactly one user prompt message
      """
      context_prompt_content = ''
      if context and 'context_prompt' in prompt_rules:
          prompt_template = PromptTemplateParser(template=prompt_rules['context_prompt'])
          context_prompt_content = prompt_template.format({'context': context})

      pre_prompt_content = ''
      if pre_prompt:
          prompt_template = PromptTemplateParser(template=pre_prompt)
          # Only inputs matching a variable of the pre-prompt template are passed on.
          prompt_inputs = {k: inputs[k] for k in prompt_template.variable_keys if k in inputs}
          pre_prompt_content = prompt_template.format(prompt_inputs)

      # Prompt without histories: final prompt when no histories are added,
      # and the basis for the token estimate otherwise.
      prompt = ''
      for order in prompt_rules['system_prompt_orders']:
          if order == 'context_prompt':
              prompt += context_prompt_content
          elif order == 'pre_prompt':
              prompt += pre_prompt_content

      query_prompt = prompt_rules.get('query_prompt', '{{query}}')

      if memory and 'histories_prompt' in prompt_rules:
          # Measure the prompt without histories to learn how many tokens are left for them.
          tmp_human_message = UserPromptMessage(
              content=PromptBuilder.parse_prompt(
                  prompt=prompt + query_prompt,
                  inputs={
                      'query': query
                  }
              )
          )

          rest_tokens = self._calculate_rest_token([tmp_human_message], model_config)

          # The human prefix labels human turns and the assistant prefix labels
          # assistant turns; they must not be crossed over.
          histories = self._get_history_messages_from_memory(
              memory=memory,
              max_token_limit=rest_tokens,
              human_prefix=prompt_rules.get('human_prefix', 'Human'),
              ai_prefix=prompt_rules.get('assistant_prefix', 'Assistant')
          )
          prompt_template = PromptTemplateParser(template=prompt_rules['histories_prompt'])
          histories_prompt_content = prompt_template.format({'histories': histories})

          # Rebuild the prompt, this time including the histories section.
          prompt = ''
          for order in prompt_rules['system_prompt_orders']:
              if order == 'context_prompt':
                  prompt += context_prompt_content
              elif order == 'pre_prompt':
                  prompt += (pre_prompt_content + '\n') if pre_prompt_content else ''
              elif order == 'histories_prompt':
                  prompt += histories_prompt_content

      prompt_template = PromptTemplateParser(template=query_prompt)
      prompt += prompt_template.format({'query': query})

      prompt = re.sub(r'<\|.*?\|>', '', prompt)

      # Files are attached whenever they are supplied, whatever the model mode.
      if files:
          prompt_message_contents = [TextPromptMessageContent(data=prompt)]
          prompt_message_contents.extend(file.prompt_message_content for file in files)
          return [UserPromptMessage(content=prompt_message_contents)]

      return [UserPromptMessage(content=prompt)]
  302. def _set_context_variable(self, context: str, prompt_template: PromptTemplateParser, prompt_inputs: dict) -> None:
  303. if '#context#' in prompt_template.variable_keys:
  304. if context:
  305. prompt_inputs['#context#'] = context
  306. else:
  307. prompt_inputs['#context#'] = ''
  308. def _set_query_variable(self, query: str, prompt_template: PromptTemplateParser, prompt_inputs: dict) -> None:
  309. if '#query#' in prompt_template.variable_keys:
  310. if query:
  311. prompt_inputs['#query#'] = query
  312. else:
  313. prompt_inputs['#query#'] = ''
  314. def _set_histories_variable(self, memory: TokenBufferMemory,
  315. raw_prompt: str,
  316. role_prefix: AdvancedCompletionPromptTemplateEntity.RolePrefixEntity,
  317. prompt_template: PromptTemplateParser,
  318. prompt_inputs: dict,
  319. model_config: ModelConfigEntity) -> None:
  320. if '#histories#' in prompt_template.variable_keys:
  321. if memory:
  322. tmp_human_message = UserPromptMessage(
  323. content=PromptBuilder.parse_prompt(
  324. prompt=raw_prompt,
  325. inputs={'#histories#': '', **prompt_inputs}
  326. )
  327. )
  328. rest_tokens = self._calculate_rest_token([tmp_human_message], model_config)
  329. histories = self._get_history_messages_from_memory(
  330. memory=memory,
  331. max_token_limit=rest_tokens,
  332. human_prefix=role_prefix.user,
  333. ai_prefix=role_prefix.assistant
  334. )
  335. prompt_inputs['#histories#'] = histories
  336. else:
  337. prompt_inputs['#histories#'] = ''
  338. def _append_chat_histories(self, memory: TokenBufferMemory,
  339. prompt_messages: list[PromptMessage],
  340. model_config: ModelConfigEntity) -> None:
  341. if memory:
  342. rest_tokens = self._calculate_rest_token(prompt_messages, model_config)
  343. histories = self._get_history_messages_list_from_memory(memory, rest_tokens)
  344. prompt_messages.extend(histories)
  def _calculate_rest_token(self, prompt_messages: list[PromptMessage], model_config: ModelConfigEntity) -> int:
      """
      Compute how many tokens remain after the given messages.

      When the model schema reports a context size, the result is that size
      minus the configured ``max_tokens`` and minus the token count of
      ``prompt_messages``, floored at 0. Without a context size the result
      is 2000.

      :param prompt_messages: messages whose tokens are already committed
      :param model_config: model configuration
      :return: remaining token count, never negative
      """
      context_size = model_config.model_schema.model_properties.get(ModelPropertyKey.CONTEXT_SIZE)
      if not context_size:
          return 2000

      llm = cast(LargeLanguageModel, model_config.provider_model_bundle.model_type_instance)
      used_tokens = llm.get_num_tokens(
          model_config.model,
          model_config.credentials,
          prompt_messages
      )

      # The rule is matched by its own name or by its template name; the last
      # matching rule decides the value.
      reserved_tokens = 0
      for rule in model_config.model_schema.parameter_rules:
          if 'max_tokens' in (rule.name, rule.use_template):
              reserved_tokens = (model_config.parameters.get(rule.name)
                                 or model_config.parameters.get(rule.use_template)) or 0

      return max(context_size - reserved_tokens - used_tokens, 0)
  365. def _format_prompt(self, prompt_template: PromptTemplateParser, prompt_inputs: dict) -> str:
  366. prompt = prompt_template.format(
  367. prompt_inputs
  368. )
  369. prompt = re.sub(r'<\|.*?\|>', '', prompt)
  370. return prompt
  def _get_chat_app_completion_model_prompt_messages(self,
                                                     prompt_template_entity: PromptTemplateEntity,
                                                     inputs: dict,
                                                     query: str,
                                                     files: List[FileObj],
                                                     context: Optional[str],
                                                     memory: Optional[TokenBufferMemory],
                                                     model_config: ModelConfigEntity) -> List[PromptMessage]:
      """
      Build the prompt for a chat app running on a completion model.

      The advanced completion template is filled with the matching inputs
      plus the ``#context#``, ``#query#`` and ``#histories#`` variables, and
      wrapped in a single user message together with any files.

      :param prompt_template_entity: entity holding the advanced completion template
      :param inputs: values for the template variables
      :param query: user query
      :param files: files to attach to the user message
      :param context: context text, may be None
      :param memory: conversation memory, may be None
      :param model_config: model configuration
      :return: list containing one user prompt message
      """
      completion_template = prompt_template_entity.advanced_completion_prompt_template
      raw_prompt = completion_template.prompt
      role_prefix = completion_template.role_prefix

      parser = PromptTemplateParser(template=raw_prompt)
      # Only inputs matching a variable of the template are passed on.
      variables = {key: inputs[key] for key in parser.variable_keys if key in inputs}

      self._set_context_variable(context, parser, variables)
      self._set_query_variable(query, parser, variables)
      self._set_histories_variable(
          memory=memory,
          raw_prompt=raw_prompt,
          role_prefix=role_prefix,
          prompt_template=parser,
          prompt_inputs=variables,
          model_config=model_config
      )

      rendered = self._format_prompt(parser, variables)

      if files:
          user_content = [TextPromptMessageContent(data=rendered)]
          user_content.extend(file.prompt_message_content for file in files)
      else:
          user_content = rendered

      return [UserPromptMessage(content=user_content)]
  def _get_chat_app_chat_model_prompt_messages(self,
                                               prompt_template_entity: PromptTemplateEntity,
                                               inputs: dict,
                                               query: str,
                                               files: List[FileObj],
                                               context: Optional[str],
                                               memory: Optional[TokenBufferMemory],
                                               model_config: ModelConfigEntity) -> List[PromptMessage]:
      """
      Build the message list for a chat app running on a chat model.

      Each item of the advanced chat template is formatted and turned into a
      message of its role (system items with empty text are skipped). The
      chat histories follow, then a user message carrying the query and,
      when given, the files.

      :param prompt_template_entity: entity holding the advanced chat template
      :param inputs: values for the template variables
      :param query: user query
      :param files: files to attach to the final user message
      :param context: context text, may be None
      :param memory: conversation memory, may be None
      :param model_config: model configuration
      :return: prompt messages
      """
      messages = []

      for item in prompt_template_entity.advanced_chat_prompt_template.messages:
          parser = PromptTemplateParser(template=item.text)
          # Only inputs matching a variable of the template are passed on.
          variables = {key: inputs[key] for key in parser.variable_keys if key in inputs}
          self._set_context_variable(context, parser, variables)

          rendered = self._format_prompt(parser, variables)

          if item.role == PromptMessageRole.USER:
              messages.append(UserPromptMessage(content=rendered))
          elif item.role == PromptMessageRole.SYSTEM and rendered:
              messages.append(SystemPromptMessage(content=rendered))
          elif item.role == PromptMessageRole.ASSISTANT:
              messages.append(AssistantPromptMessage(content=rendered))

      self._append_chat_histories(memory, messages, model_config)

      if files:
          user_content = [TextPromptMessageContent(data=query)]
          user_content.extend(file.prompt_message_content for file in files)
      else:
          user_content = query
      messages.append(UserPromptMessage(content=user_content))

      return messages
  def _get_completion_app_completion_model_prompt_messages(self,
                                                           prompt_template_entity: PromptTemplateEntity,
                                                           inputs: dict,
                                                           context: Optional[str]) -> List[PromptMessage]:
      """
      Build the prompt for a completion app running on a completion model.

      The advanced completion template is filled with the matching inputs
      and the ``#context#`` variable, then wrapped in one user message.

      :param prompt_template_entity: entity holding the advanced completion template
      :param inputs: values for the template variables
      :param context: context text, may be None
      :return: list containing one user prompt message
      """
      parser = PromptTemplateParser(
          template=prompt_template_entity.advanced_completion_prompt_template.prompt
      )
      # Only inputs matching a variable of the template are passed on.
      variables = {key: inputs[key] for key in parser.variable_keys if key in inputs}
      self._set_context_variable(context, parser, variables)

      rendered = self._format_prompt(parser, variables)
      return [UserPromptMessage(content=rendered)]
  446. def _get_completion_app_chat_model_prompt_messages(self,
  447. prompt_template_entity: PromptTemplateEntity,
  448. inputs: dict,
  449. files: List[FileObj],
  450. context: Optional[str]) -> List[PromptMessage]:
  451. raw_prompt_list = prompt_template_entity.advanced_chat_prompt_template.messages
  452. prompt_messages = []
  453. for prompt_item in raw_prompt_list:
  454. raw_prompt = prompt_item.text
  455. prompt_template = PromptTemplateParser(template=raw_prompt)
  456. prompt_inputs = {k: inputs[k] for k in prompt_template.variable_keys if k in inputs}
  457. self._set_context_variable(context, prompt_template, prompt_inputs)
  458. prompt = self._format_prompt(prompt_template, prompt_inputs)
  459. if prompt_item.role == PromptMessageRole.USER:
  460. prompt_messages.append(UserPromptMessage(content=prompt))
  461. elif prompt_item.role == PromptMessageRole.SYSTEM and prompt:
  462. prompt_messages.append(SystemPromptMessage(content=prompt))
  463. elif prompt_item.role == PromptMessageRole.ASSISTANT:
  464. prompt_messages.append(AssistantPromptMessage(content=prompt))
  465. for prompt_message in prompt_messages[::-1]:
  466. if prompt_message.role == PromptMessageRole.USER:
  467. if files:
  468. prompt_message_contents = [TextPromptMessageContent(data=prompt_message.content)]
  469. for file in files:
  470. prompt_message_contents.append(file.prompt_message_content)
  471. prompt_message.content = prompt_message_contents
  472. break
  473. return prompt_messages