prompt_transform.py 24 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590
  1. import enum
  2. import json
  3. import os
  4. import re
  5. from typing import Optional, cast
  6. from core.entities.application_entities import (
  7. AdvancedCompletionPromptTemplateEntity,
  8. ModelConfigEntity,
  9. PromptTemplateEntity,
  10. )
  11. from core.file.file_obj import FileObj
  12. from core.memory.token_buffer_memory import TokenBufferMemory
  13. from core.model_runtime.entities.message_entities import (
  14. AssistantPromptMessage,
  15. PromptMessage,
  16. PromptMessageRole,
  17. SystemPromptMessage,
  18. TextPromptMessageContent,
  19. UserPromptMessage,
  20. )
  21. from core.model_runtime.entities.model_entities import ModelPropertyKey
  22. from core.model_runtime.model_providers.__base.large_language_model import LargeLanguageModel
  23. from core.prompt.prompt_builder import PromptBuilder
  24. from core.prompt.prompt_template import PromptTemplateParser
  25. class AppMode(enum.Enum):
  26. COMPLETION = 'completion'
  27. CHAT = 'chat'
  28. @classmethod
  29. def value_of(cls, value: str) -> 'AppMode':
  30. """
  31. Get value of given mode.
  32. :param value: mode value
  33. :return: mode
  34. """
  35. for mode in cls:
  36. if mode.value == value:
  37. return mode
  38. raise ValueError(f'invalid mode value {value}')
  39. class ModelMode(enum.Enum):
  40. COMPLETION = 'completion'
  41. CHAT = 'chat'
  42. @classmethod
  43. def value_of(cls, value: str) -> 'ModelMode':
  44. """
  45. Get value of given mode.
  46. :param value: mode value
  47. :return: mode
  48. """
  49. for mode in cls:
  50. if mode.value == value:
  51. return mode
  52. raise ValueError(f'invalid mode value {value}')
  53. class PromptTransform:
  54. def get_prompt(self,
  55. app_mode: str,
  56. prompt_template_entity: PromptTemplateEntity,
  57. inputs: dict,
  58. query: str,
  59. files: list[FileObj],
  60. context: Optional[str],
  61. memory: Optional[TokenBufferMemory],
  62. model_config: ModelConfigEntity) -> \
  63. tuple[list[PromptMessage], Optional[list[str]]]:
  64. app_mode = AppMode.value_of(app_mode)
  65. model_mode = ModelMode.value_of(model_config.mode)
  66. prompt_rules = self._read_prompt_rules_from_file(self._prompt_file_name(
  67. app_mode=app_mode,
  68. provider=model_config.provider,
  69. model=model_config.model
  70. ))
  71. if app_mode == AppMode.CHAT and model_mode == ModelMode.CHAT:
  72. stops = None
  73. prompt_messages = self._get_simple_chat_app_chat_model_prompt_messages(
  74. prompt_rules=prompt_rules,
  75. pre_prompt=prompt_template_entity.simple_prompt_template,
  76. inputs=inputs,
  77. query=query,
  78. files=files,
  79. context=context,
  80. memory=memory,
  81. model_config=model_config
  82. )
  83. else:
  84. stops = prompt_rules.get('stops')
  85. if stops is not None and len(stops) == 0:
  86. stops = None
  87. prompt_messages = self._get_simple_others_prompt_messages(
  88. prompt_rules=prompt_rules,
  89. pre_prompt=prompt_template_entity.simple_prompt_template,
  90. inputs=inputs,
  91. query=query,
  92. files=files,
  93. context=context,
  94. memory=memory,
  95. model_config=model_config
  96. )
  97. return prompt_messages, stops
  98. def get_advanced_prompt(self, app_mode: str,
  99. prompt_template_entity: PromptTemplateEntity,
  100. inputs: dict,
  101. query: str,
  102. files: list[FileObj],
  103. context: Optional[str],
  104. memory: Optional[TokenBufferMemory],
  105. model_config: ModelConfigEntity) -> list[PromptMessage]:
  106. app_mode = AppMode.value_of(app_mode)
  107. model_mode = ModelMode.value_of(model_config.mode)
  108. prompt_messages = []
  109. if app_mode == AppMode.CHAT:
  110. if model_mode == ModelMode.COMPLETION:
  111. prompt_messages = self._get_chat_app_completion_model_prompt_messages(
  112. prompt_template_entity=prompt_template_entity,
  113. inputs=inputs,
  114. query=query,
  115. files=files,
  116. context=context,
  117. memory=memory,
  118. model_config=model_config
  119. )
  120. elif model_mode == ModelMode.CHAT:
  121. prompt_messages = self._get_chat_app_chat_model_prompt_messages(
  122. prompt_template_entity=prompt_template_entity,
  123. inputs=inputs,
  124. query=query,
  125. files=files,
  126. context=context,
  127. memory=memory,
  128. model_config=model_config
  129. )
  130. elif app_mode == AppMode.COMPLETION:
  131. if model_mode == ModelMode.CHAT:
  132. prompt_messages = self._get_completion_app_chat_model_prompt_messages(
  133. prompt_template_entity=prompt_template_entity,
  134. inputs=inputs,
  135. files=files,
  136. context=context,
  137. )
  138. elif model_mode == ModelMode.COMPLETION:
  139. prompt_messages = self._get_completion_app_completion_model_prompt_messages(
  140. prompt_template_entity=prompt_template_entity,
  141. inputs=inputs,
  142. context=context,
  143. )
  144. return prompt_messages
  145. def _get_history_messages_from_memory(self, memory: TokenBufferMemory,
  146. max_token_limit: int,
  147. human_prefix: Optional[str] = None,
  148. ai_prefix: Optional[str] = None) -> str:
  149. """Get memory messages."""
  150. kwargs = {
  151. "max_token_limit": max_token_limit
  152. }
  153. if human_prefix:
  154. kwargs['human_prefix'] = human_prefix
  155. if ai_prefix:
  156. kwargs['ai_prefix'] = ai_prefix
  157. return memory.get_history_prompt_text(
  158. **kwargs
  159. )
  160. def _get_history_messages_list_from_memory(self, memory: TokenBufferMemory,
  161. max_token_limit: int) -> list[PromptMessage]:
  162. """Get memory messages."""
  163. return memory.get_history_prompt_messages(
  164. max_token_limit=max_token_limit
  165. )
  166. def _prompt_file_name(self, app_mode: AppMode, provider: str, model: str) -> str:
  167. # baichuan
  168. if provider == 'baichuan':
  169. return self._prompt_file_name_for_baichuan(app_mode)
  170. baichuan_supported_providers = ["huggingface_hub", "openllm", "xinference"]
  171. if provider in baichuan_supported_providers and 'baichuan' in model.lower():
  172. return self._prompt_file_name_for_baichuan(app_mode)
  173. # common
  174. if app_mode == AppMode.COMPLETION:
  175. return 'common_completion'
  176. else:
  177. return 'common_chat'
  178. def _prompt_file_name_for_baichuan(self, app_mode: AppMode) -> str:
  179. if app_mode == AppMode.COMPLETION:
  180. return 'baichuan_completion'
  181. else:
  182. return 'baichuan_chat'
  183. def _read_prompt_rules_from_file(self, prompt_name: str) -> dict:
  184. # Get the absolute path of the subdirectory
  185. prompt_path = os.path.join(
  186. os.path.dirname(os.path.realpath(__file__)),
  187. 'generate_prompts')
  188. json_file_path = os.path.join(prompt_path, f'{prompt_name}.json')
  189. # Open the JSON file and read its content
  190. with open(json_file_path, encoding='utf-8') as json_file:
  191. return json.load(json_file)
  192. def _get_simple_chat_app_chat_model_prompt_messages(self, prompt_rules: dict,
  193. pre_prompt: str,
  194. inputs: dict,
  195. query: str,
  196. context: Optional[str],
  197. files: list[FileObj],
  198. memory: Optional[TokenBufferMemory],
  199. model_config: ModelConfigEntity) -> list[PromptMessage]:
  200. prompt_messages = []
  201. context_prompt_content = ''
  202. if context and 'context_prompt' in prompt_rules:
  203. prompt_template = PromptTemplateParser(template=prompt_rules['context_prompt'])
  204. context_prompt_content = prompt_template.format(
  205. {'context': context}
  206. )
  207. pre_prompt_content = ''
  208. if pre_prompt:
  209. prompt_template = PromptTemplateParser(template=pre_prompt)
  210. prompt_inputs = {k: inputs[k] for k in prompt_template.variable_keys if k in inputs}
  211. pre_prompt_content = prompt_template.format(
  212. prompt_inputs
  213. )
  214. prompt = ''
  215. for order in prompt_rules['system_prompt_orders']:
  216. if order == 'context_prompt':
  217. prompt += context_prompt_content
  218. elif order == 'pre_prompt':
  219. prompt += pre_prompt_content
  220. prompt = re.sub(r'<\|.*?\|>', '', prompt)
  221. if prompt:
  222. prompt_messages.append(SystemPromptMessage(content=prompt))
  223. self._append_chat_histories(
  224. memory=memory,
  225. prompt_messages=prompt_messages,
  226. model_config=model_config
  227. )
  228. if files:
  229. prompt_message_contents = [TextPromptMessageContent(data=query)]
  230. for file in files:
  231. prompt_message_contents.append(file.prompt_message_content)
  232. prompt_messages.append(UserPromptMessage(content=prompt_message_contents))
  233. else:
  234. prompt_messages.append(UserPromptMessage(content=query))
  235. return prompt_messages
  236. def _get_simple_others_prompt_messages(self, prompt_rules: dict,
  237. pre_prompt: str,
  238. inputs: dict,
  239. query: str,
  240. context: Optional[str],
  241. memory: Optional[TokenBufferMemory],
  242. files: list[FileObj],
  243. model_config: ModelConfigEntity) -> list[PromptMessage]:
  244. context_prompt_content = ''
  245. if context and 'context_prompt' in prompt_rules:
  246. prompt_template = PromptTemplateParser(template=prompt_rules['context_prompt'])
  247. context_prompt_content = prompt_template.format(
  248. {'context': context}
  249. )
  250. pre_prompt_content = ''
  251. if pre_prompt:
  252. prompt_template = PromptTemplateParser(template=pre_prompt)
  253. prompt_inputs = {k: inputs[k] for k in prompt_template.variable_keys if k in inputs}
  254. pre_prompt_content = prompt_template.format(
  255. prompt_inputs
  256. )
  257. prompt = ''
  258. for order in prompt_rules['system_prompt_orders']:
  259. if order == 'context_prompt':
  260. prompt += context_prompt_content
  261. elif order == 'pre_prompt':
  262. prompt += pre_prompt_content
  263. query_prompt = prompt_rules['query_prompt'] if 'query_prompt' in prompt_rules else '{{query}}'
  264. if memory and 'histories_prompt' in prompt_rules:
  265. # append chat histories
  266. tmp_human_message = UserPromptMessage(
  267. content=PromptBuilder.parse_prompt(
  268. prompt=prompt + query_prompt,
  269. inputs={
  270. 'query': query
  271. }
  272. )
  273. )
  274. rest_tokens = self._calculate_rest_token([tmp_human_message], model_config)
  275. histories = self._get_history_messages_from_memory(
  276. memory=memory,
  277. max_token_limit=rest_tokens,
  278. ai_prefix=prompt_rules['human_prefix'] if 'human_prefix' in prompt_rules else 'Human',
  279. human_prefix=prompt_rules['assistant_prefix'] if 'assistant_prefix' in prompt_rules else 'Assistant'
  280. )
  281. prompt_template = PromptTemplateParser(template=prompt_rules['histories_prompt'])
  282. histories_prompt_content = prompt_template.format({'histories': histories})
  283. prompt = ''
  284. for order in prompt_rules['system_prompt_orders']:
  285. if order == 'context_prompt':
  286. prompt += context_prompt_content
  287. elif order == 'pre_prompt':
  288. prompt += (pre_prompt_content + '\n') if pre_prompt_content else ''
  289. elif order == 'histories_prompt':
  290. prompt += histories_prompt_content
  291. prompt_template = PromptTemplateParser(template=query_prompt)
  292. query_prompt_content = prompt_template.format({'query': query})
  293. prompt += query_prompt_content
  294. prompt = re.sub(r'<\|.*?\|>', '', prompt)
  295. model_mode = ModelMode.value_of(model_config.mode)
  296. if model_mode == ModelMode.CHAT and files:
  297. prompt_message_contents = [TextPromptMessageContent(data=prompt)]
  298. for file in files:
  299. prompt_message_contents.append(file.prompt_message_content)
  300. prompt_message = UserPromptMessage(content=prompt_message_contents)
  301. else:
  302. if files:
  303. prompt_message_contents = [TextPromptMessageContent(data=prompt)]
  304. for file in files:
  305. prompt_message_contents.append(file.prompt_message_content)
  306. prompt_message = UserPromptMessage(content=prompt_message_contents)
  307. else:
  308. prompt_message = UserPromptMessage(content=prompt)
  309. return [prompt_message]
  310. def _set_context_variable(self, context: str, prompt_template: PromptTemplateParser, prompt_inputs: dict) -> None:
  311. if '#context#' in prompt_template.variable_keys:
  312. if context:
  313. prompt_inputs['#context#'] = context
  314. else:
  315. prompt_inputs['#context#'] = ''
  316. def _set_query_variable(self, query: str, prompt_template: PromptTemplateParser, prompt_inputs: dict) -> None:
  317. if '#query#' in prompt_template.variable_keys:
  318. if query:
  319. prompt_inputs['#query#'] = query
  320. else:
  321. prompt_inputs['#query#'] = ''
  322. def _set_histories_variable(self, memory: TokenBufferMemory,
  323. raw_prompt: str,
  324. role_prefix: AdvancedCompletionPromptTemplateEntity.RolePrefixEntity,
  325. prompt_template: PromptTemplateParser,
  326. prompt_inputs: dict,
  327. model_config: ModelConfigEntity) -> None:
  328. if '#histories#' in prompt_template.variable_keys:
  329. if memory:
  330. tmp_human_message = UserPromptMessage(
  331. content=PromptBuilder.parse_prompt(
  332. prompt=raw_prompt,
  333. inputs={'#histories#': '', **prompt_inputs}
  334. )
  335. )
  336. rest_tokens = self._calculate_rest_token([tmp_human_message], model_config)
  337. histories = self._get_history_messages_from_memory(
  338. memory=memory,
  339. max_token_limit=rest_tokens,
  340. human_prefix=role_prefix.user,
  341. ai_prefix=role_prefix.assistant
  342. )
  343. prompt_inputs['#histories#'] = histories
  344. else:
  345. prompt_inputs['#histories#'] = ''
  346. def _append_chat_histories(self, memory: TokenBufferMemory,
  347. prompt_messages: list[PromptMessage],
  348. model_config: ModelConfigEntity) -> None:
  349. if memory:
  350. rest_tokens = self._calculate_rest_token(prompt_messages, model_config)
  351. histories = self._get_history_messages_list_from_memory(memory, rest_tokens)
  352. prompt_messages.extend(histories)
  353. def _calculate_rest_token(self, prompt_messages: list[PromptMessage], model_config: ModelConfigEntity) -> int:
  354. rest_tokens = 2000
  355. model_context_tokens = model_config.model_schema.model_properties.get(ModelPropertyKey.CONTEXT_SIZE)
  356. if model_context_tokens:
  357. model_type_instance = model_config.provider_model_bundle.model_type_instance
  358. model_type_instance = cast(LargeLanguageModel, model_type_instance)
  359. curr_message_tokens = model_type_instance.get_num_tokens(
  360. model_config.model,
  361. model_config.credentials,
  362. prompt_messages
  363. )
  364. max_tokens = 0
  365. for parameter_rule in model_config.model_schema.parameter_rules:
  366. if (parameter_rule.name == 'max_tokens'
  367. or (parameter_rule.use_template and parameter_rule.use_template == 'max_tokens')):
  368. max_tokens = (model_config.parameters.get(parameter_rule.name)
  369. or model_config.parameters.get(parameter_rule.use_template)) or 0
  370. rest_tokens = model_context_tokens - max_tokens - curr_message_tokens
  371. rest_tokens = max(rest_tokens, 0)
  372. return rest_tokens
  373. def _format_prompt(self, prompt_template: PromptTemplateParser, prompt_inputs: dict) -> str:
  374. prompt = prompt_template.format(
  375. prompt_inputs
  376. )
  377. prompt = re.sub(r'<\|.*?\|>', '', prompt)
  378. return prompt
  379. def _get_chat_app_completion_model_prompt_messages(self,
  380. prompt_template_entity: PromptTemplateEntity,
  381. inputs: dict,
  382. query: str,
  383. files: list[FileObj],
  384. context: Optional[str],
  385. memory: Optional[TokenBufferMemory],
  386. model_config: ModelConfigEntity) -> list[PromptMessage]:
  387. raw_prompt = prompt_template_entity.advanced_completion_prompt_template.prompt
  388. role_prefix = prompt_template_entity.advanced_completion_prompt_template.role_prefix
  389. prompt_messages = []
  390. prompt_template = PromptTemplateParser(template=raw_prompt)
  391. prompt_inputs = {k: inputs[k] for k in prompt_template.variable_keys if k in inputs}
  392. self._set_context_variable(context, prompt_template, prompt_inputs)
  393. self._set_query_variable(query, prompt_template, prompt_inputs)
  394. self._set_histories_variable(
  395. memory=memory,
  396. raw_prompt=raw_prompt,
  397. role_prefix=role_prefix,
  398. prompt_template=prompt_template,
  399. prompt_inputs=prompt_inputs,
  400. model_config=model_config
  401. )
  402. prompt = self._format_prompt(prompt_template, prompt_inputs)
  403. if files:
  404. prompt_message_contents = [TextPromptMessageContent(data=prompt)]
  405. for file in files:
  406. prompt_message_contents.append(file.prompt_message_content)
  407. prompt_messages.append(UserPromptMessage(content=prompt_message_contents))
  408. else:
  409. prompt_messages.append(UserPromptMessage(content=prompt))
  410. return prompt_messages
  411. def _get_chat_app_chat_model_prompt_messages(self,
  412. prompt_template_entity: PromptTemplateEntity,
  413. inputs: dict,
  414. query: str,
  415. files: list[FileObj],
  416. context: Optional[str],
  417. memory: Optional[TokenBufferMemory],
  418. model_config: ModelConfigEntity) -> list[PromptMessage]:
  419. raw_prompt_list = prompt_template_entity.advanced_chat_prompt_template.messages
  420. prompt_messages = []
  421. for prompt_item in raw_prompt_list:
  422. raw_prompt = prompt_item.text
  423. prompt_template = PromptTemplateParser(template=raw_prompt)
  424. prompt_inputs = {k: inputs[k] for k in prompt_template.variable_keys if k in inputs}
  425. self._set_context_variable(context, prompt_template, prompt_inputs)
  426. prompt = self._format_prompt(prompt_template, prompt_inputs)
  427. if prompt_item.role == PromptMessageRole.USER:
  428. prompt_messages.append(UserPromptMessage(content=prompt))
  429. elif prompt_item.role == PromptMessageRole.SYSTEM and prompt:
  430. prompt_messages.append(SystemPromptMessage(content=prompt))
  431. elif prompt_item.role == PromptMessageRole.ASSISTANT:
  432. prompt_messages.append(AssistantPromptMessage(content=prompt))
  433. self._append_chat_histories(memory, prompt_messages, model_config)
  434. if files:
  435. prompt_message_contents = [TextPromptMessageContent(data=query)]
  436. for file in files:
  437. prompt_message_contents.append(file.prompt_message_content)
  438. prompt_messages.append(UserPromptMessage(content=prompt_message_contents))
  439. else:
  440. prompt_messages.append(UserPromptMessage(content=query))
  441. return prompt_messages
  442. def _get_completion_app_completion_model_prompt_messages(self,
  443. prompt_template_entity: PromptTemplateEntity,
  444. inputs: dict,
  445. context: Optional[str]) -> list[PromptMessage]:
  446. raw_prompt = prompt_template_entity.advanced_completion_prompt_template.prompt
  447. prompt_messages = []
  448. prompt_template = PromptTemplateParser(template=raw_prompt)
  449. prompt_inputs = {k: inputs[k] for k in prompt_template.variable_keys if k in inputs}
  450. self._set_context_variable(context, prompt_template, prompt_inputs)
  451. prompt = self._format_prompt(prompt_template, prompt_inputs)
  452. prompt_messages.append(UserPromptMessage(content=prompt))
  453. return prompt_messages
  454. def _get_completion_app_chat_model_prompt_messages(self,
  455. prompt_template_entity: PromptTemplateEntity,
  456. inputs: dict,
  457. files: list[FileObj],
  458. context: Optional[str]) -> list[PromptMessage]:
  459. raw_prompt_list = prompt_template_entity.advanced_chat_prompt_template.messages
  460. prompt_messages = []
  461. for prompt_item in raw_prompt_list:
  462. raw_prompt = prompt_item.text
  463. prompt_template = PromptTemplateParser(template=raw_prompt)
  464. prompt_inputs = {k: inputs[k] for k in prompt_template.variable_keys if k in inputs}
  465. self._set_context_variable(context, prompt_template, prompt_inputs)
  466. prompt = self._format_prompt(prompt_template, prompt_inputs)
  467. if prompt_item.role == PromptMessageRole.USER:
  468. prompt_messages.append(UserPromptMessage(content=prompt))
  469. elif prompt_item.role == PromptMessageRole.SYSTEM and prompt:
  470. prompt_messages.append(SystemPromptMessage(content=prompt))
  471. elif prompt_item.role == PromptMessageRole.ASSISTANT:
  472. prompt_messages.append(AssistantPromptMessage(content=prompt))
  473. for prompt_message in prompt_messages[::-1]:
  474. if prompt_message.role == PromptMessageRole.USER:
  475. if files:
  476. prompt_message_contents = [TextPromptMessageContent(data=prompt_message.content)]
  477. for file in files:
  478. prompt_message_contents.append(file.prompt_message_content)
  479. prompt_message.content = prompt_message_contents
  480. break
  481. return prompt_messages