prompt_transform.py 24 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581
  1. import json
  2. import os
  3. import re
  4. import enum
  5. from typing import List, Optional, Tuple, cast
  6. from core.entities.application_entities import ModelConfigEntity, PromptTemplateEntity, \
  7. AdvancedCompletionPromptTemplateEntity
  8. from core.file.file_obj import FileObj
  9. from core.memory.token_buffer_memory import TokenBufferMemory
  10. from core.model_runtime.entities.message_entities import PromptMessage, SystemPromptMessage, UserPromptMessage, \
  11. TextPromptMessageContent, PromptMessageRole, AssistantPromptMessage
  12. from core.model_runtime.entities.model_entities import ModelPropertyKey
  13. from core.model_runtime.model_providers.__base.large_language_model import LargeLanguageModel
  14. from core.prompt.prompt_builder import PromptBuilder
  15. from core.prompt.prompt_template import PromptTemplateParser
  class AppMode(enum.Enum):
      """
      Application modes understood by the prompt transform.
      """
      COMPLETION = 'completion'
      CHAT = 'chat'

      @classmethod
      def value_of(cls, value: str) -> 'AppMode':
          """
          Resolve a raw mode string to its enum member.

          :param value: mode value
          :return: the member whose value equals ``value``
          :raises ValueError: when no member carries that value
          """
          found = next((member for member in cls if member.value == value), None)
          if found is None:
              raise ValueError(f'invalid mode value {value}')
          return found
  class ModelMode(enum.Enum):
      """
      Model modes understood by the prompt transform.
      """
      COMPLETION = 'completion'
      CHAT = 'chat'

      @classmethod
      def value_of(cls, value: str) -> 'ModelMode':
          """
          Resolve a raw mode string to its enum member.

          :param value: mode value
          :return: the member whose value equals ``value``
          :raises ValueError: when no member carries that value
          """
          found = next((member for member in cls if member.value == value), None)
          if found is None:
              raise ValueError(f'invalid mode value {value}')
          return found
  44. class PromptTransform:
  def get_prompt(self,
                 app_mode: str,
                 prompt_template_entity: PromptTemplateEntity,
                 inputs: dict,
                 query: str,
                 files: List[FileObj],
                 context: Optional[str],
                 memory: Optional[TokenBufferMemory],
                 model_config: ModelConfigEntity) -> \
          Tuple[List[PromptMessage], Optional[List[str]]]:
      """
      Build prompt messages and stop words from the simple prompt template.

      The prompt rules are loaded from the JSON file chosen by app mode,
      provider and model. A chat app on a chat model never gets stop words;
      every other combination takes them from the rules' ``stops`` entry,
      with an empty value normalised to ``None``.

      :param app_mode: app mode value, resolved through ``AppMode.value_of``
      :param prompt_template_entity: entity whose ``simple_prompt_template`` is used as pre-prompt
      :param inputs: values for the variables of the pre-prompt
      :param query: user query
      :param files: files attached to the user message
      :param context: optional context text
      :param memory: optional conversation memory
      :param model_config: model configuration (mode, provider, model)
      :return: tuple of (prompt messages, stops or None)
      :raises ValueError: if the app mode or the model mode value is unknown
      """
      app_mode = AppMode.value_of(app_mode)
      model_mode = ModelMode.value_of(model_config.mode)

      rules_file = self._prompt_file_name(
          app_mode=app_mode,
          provider=model_config.provider,
          model=model_config.model
      )
      prompt_rules = self._read_prompt_rules_from_file(rules_file)

      # Both builders accept the same keyword arguments.
      builder_kwargs = dict(
          prompt_rules=prompt_rules,
          pre_prompt=prompt_template_entity.simple_prompt_template,
          inputs=inputs,
          query=query,
          files=files,
          context=context,
          memory=memory,
          model_config=model_config
      )

      if app_mode == AppMode.CHAT and model_mode == ModelMode.CHAT:
          return self._get_simple_chat_app_chat_model_prompt_messages(**builder_kwargs), None

      stops = prompt_rules.get('stops')
      if stops is not None and len(stops) == 0:
          stops = None

      return self._get_simple_others_prompt_messages(**builder_kwargs), stops
  def get_advanced_prompt(self, app_mode: str,
                          prompt_template_entity: PromptTemplateEntity,
                          inputs: dict,
                          query: str,
                          files: List[FileObj],
                          context: Optional[str],
                          memory: Optional[TokenBufferMemory],
                          model_config: ModelConfigEntity) -> List[PromptMessage]:
      """
      Build prompt messages from the advanced prompt templates.

      Dispatches on the (app mode, model mode) pair to one of the four
      advanced builders of this class.

      :param app_mode: app mode value, resolved through ``AppMode.value_of``
      :param prompt_template_entity: entity holding the advanced templates
      :param inputs: values for the template variables
      :param query: user query (only forwarded for chat apps)
      :param files: files attached to the user message
      :param context: optional context text
      :param memory: optional conversation memory (only forwarded for chat apps)
      :param model_config: model configuration
      :return: prompt messages; an empty list if no combination matches
      :raises ValueError: if the app mode or the model mode value is unknown
      """
      app_mode = AppMode.value_of(app_mode)
      model_mode = ModelMode.value_of(model_config.mode)

      if app_mode == AppMode.CHAT:
          chat_app_kwargs = dict(
              prompt_template_entity=prompt_template_entity,
              inputs=inputs,
              query=query,
              files=files,
              context=context,
              memory=memory,
              model_config=model_config
          )
          if model_mode == ModelMode.COMPLETION:
              return self._get_chat_app_completion_model_prompt_messages(**chat_app_kwargs)
          if model_mode == ModelMode.CHAT:
              return self._get_chat_app_chat_model_prompt_messages(**chat_app_kwargs)
      elif app_mode == AppMode.COMPLETION:
          if model_mode == ModelMode.CHAT:
              return self._get_completion_app_chat_model_prompt_messages(
                  prompt_template_entity=prompt_template_entity,
                  inputs=inputs,
                  files=files,
                  context=context,
              )
          if model_mode == ModelMode.COMPLETION:
              return self._get_completion_app_completion_model_prompt_messages(
                  prompt_template_entity=prompt_template_entity,
                  inputs=inputs,
                  context=context,
              )

      return []
  136. def _get_history_messages_from_memory(self, memory: TokenBufferMemory,
  137. max_token_limit: int,
  138. human_prefix: Optional[str] = None,
  139. ai_prefix: Optional[str] = None) -> str:
  140. """Get memory messages."""
  141. kwargs = {
  142. "max_token_limit": max_token_limit
  143. }
  144. if human_prefix:
  145. kwargs['human_prefix'] = human_prefix
  146. if ai_prefix:
  147. kwargs['ai_prefix'] = ai_prefix
  148. return memory.get_history_prompt_text(
  149. **kwargs
  150. )
  151. def _get_history_messages_list_from_memory(self, memory: TokenBufferMemory,
  152. max_token_limit: int) -> List[PromptMessage]:
  153. """Get memory messages."""
  154. return memory.get_history_prompt_messages(
  155. max_token_limit=max_token_limit
  156. )
  def _prompt_file_name(self, app_mode: AppMode, provider: str, model: str) -> str:
      """
      Pick the base name of the prompt rules file.

      :param app_mode: app mode
      :param provider: model provider name
      :param model: model name
      :return: a baichuan-specific name for the ``baichuan`` provider, or for
          one of the listed hosting providers when the model name contains
          ``baichuan`` (case-insensitive); otherwise ``common_completion`` or
          ``common_chat``
      """
      baichuan_supported_providers = ["huggingface_hub", "openllm", "xinference"]
      # The model name is only inspected for the hosting providers.
      hosted_baichuan = provider in baichuan_supported_providers and 'baichuan' in model.lower()

      if provider == 'baichuan' or hosted_baichuan:
          return self._prompt_file_name_for_baichuan(app_mode)

      return 'common_completion' if app_mode == AppMode.COMPLETION else 'common_chat'
  def _prompt_file_name_for_baichuan(self, app_mode: AppMode) -> str:
      """
      Pick the base name of the baichuan prompt rules file.

      :param app_mode: app mode
      :return: ``baichuan_completion`` for completion apps, else ``baichuan_chat``
      """
      return 'baichuan_completion' if app_mode == AppMode.COMPLETION else 'baichuan_chat'
  def _read_prompt_rules_from_file(self, prompt_name: str) -> dict:
      """
      Load prompt rules from ``generate_prompts/<prompt_name>.json``.

      The ``generate_prompts`` directory is resolved next to this module's
      real path.

      :param prompt_name: base name of the JSON file, without extension
      :return: the parsed JSON content
      """
      module_dir = os.path.dirname(os.path.realpath(__file__))
      json_file_path = os.path.join(module_dir, 'generate_prompts', f'{prompt_name}.json')

      with open(json_file_path, 'r', encoding='utf-8') as json_file:
          raw_rules = json_file.read()
      return json.loads(raw_rules)
  def _get_simple_chat_app_chat_model_prompt_messages(self, prompt_rules: dict,
                                                      pre_prompt: str,
                                                      inputs: dict,
                                                      query: str,
                                                      context: Optional[str],
                                                      files: List[FileObj],
                                                      memory: Optional[TokenBufferMemory],
                                                      model_config: ModelConfigEntity) -> List[PromptMessage]:
      """
      Build the messages for a chat app running on a chat model.

      The result is: an optional system message (context prompt and
      pre-prompt joined in the order given by the rules), the chat histories
      from memory, then the user message carrying the query and any files.

      :param prompt_rules: prompt rules; ``system_prompt_orders`` is required
      :param pre_prompt: pre-prompt template, may be empty
      :param inputs: values for the pre-prompt variables
      :param query: user query
      :param context: optional context text
      :param files: files attached to the user message
      :param memory: optional conversation memory
      :param model_config: model configuration
      :return: prompt messages
      """
      context_prompt_content = ''
      if context and 'context_prompt' in prompt_rules:
          context_parser = PromptTemplateParser(template=prompt_rules['context_prompt'])
          context_prompt_content = context_parser.format({'context': context})

      pre_prompt_content = ''
      if pre_prompt:
          pre_prompt_parser = PromptTemplateParser(template=pre_prompt)
          # Only pass the inputs the template actually references.
          known_inputs = {key: inputs[key] for key in pre_prompt_parser.variable_keys if key in inputs}
          pre_prompt_content = pre_prompt_parser.format(known_inputs)

      sections = []
      for section_name in prompt_rules['system_prompt_orders']:
          if section_name == 'pre_prompt':
              sections.append(pre_prompt_content)
          elif section_name == 'context_prompt':
              sections.append(context_prompt_content)

      # Strip `<|...|>` markers from the assembled system prompt.
      system_prompt = re.sub(r'<\|.*?\|>', '', ''.join(sections))

      prompt_messages = []
      if system_prompt:
          prompt_messages.append(SystemPromptMessage(content=system_prompt))

      self._append_chat_histories(
          memory=memory,
          prompt_messages=prompt_messages,
          model_config=model_config
      )

      if files:
          user_content = [TextPromptMessageContent(data=query)]
          user_content.extend(file.prompt_message_content for file in files)
      else:
          user_content = query
      prompt_messages.append(UserPromptMessage(content=user_content))

      return prompt_messages
  def _get_simple_others_prompt_messages(self, prompt_rules: dict,
                                         pre_prompt: str,
                                         inputs: dict,
                                         query: str,
                                         context: Optional[str],
                                         memory: Optional[TokenBufferMemory],
                                         files: List[FileObj],
                                         model_config: ModelConfigEntity) -> List[PromptMessage]:
      """
      Build the single user message for a simple prompt that is not
      chat app + chat model.

      Context prompt, pre-prompt, chat histories (when memory is given and the
      rules define ``histories_prompt``) and the query prompt are concatenated
      into one text, which is sent as one user message together with any
      files.

      :param prompt_rules: prompt rules; ``system_prompt_orders`` is required,
          ``context_prompt``, ``histories_prompt``, ``query_prompt``,
          ``human_prefix`` and ``assistant_prefix`` are optional
      :param pre_prompt: pre-prompt template, may be empty
      :param inputs: values for the pre-prompt variables
      :param query: user query
      :param context: optional context text
      :param memory: optional conversation memory
      :param files: files attached to the user message
      :param model_config: model configuration, used for the token budget
      :return: list holding the one user prompt message
      """
      context_prompt_content = ''
      if context and 'context_prompt' in prompt_rules:
          prompt_template = PromptTemplateParser(template=prompt_rules['context_prompt'])
          context_prompt_content = prompt_template.format({'context': context})

      pre_prompt_content = ''
      if pre_prompt:
          prompt_template = PromptTemplateParser(template=pre_prompt)
          # Only pass the inputs the template actually references.
          prompt_inputs = {k: inputs[k] for k in prompt_template.variable_keys if k in inputs}
          pre_prompt_content = prompt_template.format(prompt_inputs)

      prompt = ''
      for order in prompt_rules['system_prompt_orders']:
          if order == 'context_prompt':
              prompt += context_prompt_content
          elif order == 'pre_prompt':
              prompt += pre_prompt_content

      query_prompt = prompt_rules.get('query_prompt', '{{query}}')

      if memory and 'histories_prompt' in prompt_rules:
          # Measure the prompt without histories first, so the history text
          # only gets the tokens that are left.
          tmp_human_message = UserPromptMessage(
              content=PromptBuilder.parse_prompt(
                  prompt=prompt + query_prompt,
                  inputs={'query': query}
              )
          )
          rest_tokens = self._calculate_rest_token([tmp_human_message], model_config)

          # Each prefix keyword receives the label of its own role.
          histories = self._get_history_messages_from_memory(
              memory=memory,
              max_token_limit=rest_tokens,
              human_prefix=prompt_rules.get('human_prefix', 'Human'),
              ai_prefix=prompt_rules.get('assistant_prefix', 'Assistant')
          )
          prompt_template = PromptTemplateParser(template=prompt_rules['histories_prompt'])
          histories_prompt_content = prompt_template.format({'histories': histories})

          # Rebuild the prompt, this time including the histories section.
          prompt = ''
          for order in prompt_rules['system_prompt_orders']:
              if order == 'context_prompt':
                  prompt += context_prompt_content
              elif order == 'pre_prompt':
                  prompt += (pre_prompt_content + '\n') if pre_prompt_content else ''
              elif order == 'histories_prompt':
                  prompt += histories_prompt_content

      prompt_template = PromptTemplateParser(template=query_prompt)
      prompt += prompt_template.format({'query': query})

      # Strip `<|...|>` markers from the assembled prompt.
      prompt = re.sub(r'<\|.*?\|>', '', prompt)

      # Files are attached the same way whatever the model mode is.
      if files:
          prompt_message_contents = [TextPromptMessageContent(data=prompt)]
          prompt_message_contents.extend(file.prompt_message_content for file in files)
          prompt_message = UserPromptMessage(content=prompt_message_contents)
      else:
          prompt_message = UserPromptMessage(content=prompt)

      return [prompt_message]
  301. def _set_context_variable(self, context: str, prompt_template: PromptTemplateParser, prompt_inputs: dict) -> None:
  302. if '#context#' in prompt_template.variable_keys:
  303. if context:
  304. prompt_inputs['#context#'] = context
  305. else:
  306. prompt_inputs['#context#'] = ''
  307. def _set_query_variable(self, query: str, prompt_template: PromptTemplateParser, prompt_inputs: dict) -> None:
  308. if '#query#' in prompt_template.variable_keys:
  309. if query:
  310. prompt_inputs['#query#'] = query
  311. else:
  312. prompt_inputs['#query#'] = ''
  313. def _set_histories_variable(self, memory: TokenBufferMemory,
  314. raw_prompt: str,
  315. role_prefix: AdvancedCompletionPromptTemplateEntity.RolePrefixEntity,
  316. prompt_template: PromptTemplateParser,
  317. prompt_inputs: dict,
  318. model_config: ModelConfigEntity) -> None:
  319. if '#histories#' in prompt_template.variable_keys:
  320. if memory:
  321. tmp_human_message = UserPromptMessage(
  322. content=PromptBuilder.parse_prompt(
  323. prompt=raw_prompt,
  324. inputs={'#histories#': '', **prompt_inputs}
  325. )
  326. )
  327. rest_tokens = self._calculate_rest_token([tmp_human_message], model_config)
  328. histories = self._get_history_messages_from_memory(
  329. memory=memory,
  330. max_token_limit=rest_tokens,
  331. human_prefix=role_prefix.user,
  332. ai_prefix=role_prefix.assistant
  333. )
  334. prompt_inputs['#histories#'] = histories
  335. else:
  336. prompt_inputs['#histories#'] = ''
  337. def _append_chat_histories(self, memory: TokenBufferMemory,
  338. prompt_messages: list[PromptMessage],
  339. model_config: ModelConfigEntity) -> None:
  340. if memory:
  341. rest_tokens = self._calculate_rest_token(prompt_messages, model_config)
  342. histories = self._get_history_messages_list_from_memory(memory, rest_tokens)
  343. prompt_messages.extend(histories)
  def _calculate_rest_token(self, prompt_messages: list[PromptMessage], model_config: ModelConfigEntity) -> int:
      """
      Compute how many tokens are left for additional prompt content.

      :param prompt_messages: messages whose tokens are already spent
      :param model_config: model configuration (schema, parameters, credentials)
      :return: ``2000`` when the model schema gives no context size;
          otherwise context size minus the configured ``max_tokens`` minus
          the tokens of ``prompt_messages``, never below ``0``
      """
      model_context_tokens = model_config.model_schema.model_properties.get(ModelPropertyKey.CONTEXT_SIZE)
      if not model_context_tokens:
          return 2000

      llm = cast(LargeLanguageModel, model_config.provider_model_bundle.model_type_instance)
      curr_message_tokens = llm.get_num_tokens(
          model_config.model,
          model_config.credentials,
          prompt_messages
      )

      max_tokens = 0
      for rule in model_config.model_schema.parameter_rules:
          # A rule sets max_tokens either by its own name or through its template.
          is_max_tokens_rule = (rule.name == 'max_tokens'
                                or (rule.use_template and rule.use_template == 'max_tokens'))
          if is_max_tokens_rule:
              max_tokens = (model_config.parameters.get(rule.name)
                            or model_config.parameters.get(rule.use_template)) or 0

      return max(model_context_tokens - max_tokens - curr_message_tokens, 0)
  364. def _format_prompt(self, prompt_template: PromptTemplateParser, prompt_inputs: dict) -> str:
  365. prompt = prompt_template.format(
  366. prompt_inputs
  367. )
  368. prompt = re.sub(r'<\|.*?\|>', '', prompt)
  369. return prompt
  def _get_chat_app_completion_model_prompt_messages(self,
                                                     prompt_template_entity: PromptTemplateEntity,
                                                     inputs: dict,
                                                     query: str,
                                                     files: List[FileObj],
                                                     context: Optional[str],
                                                     memory: Optional[TokenBufferMemory],
                                                     model_config: ModelConfigEntity) -> List[PromptMessage]:
      """
      Build the single user message for a chat app on a completion model.

      The advanced completion template is rendered with the inputs plus the
      ``#context#``, ``#query#`` and ``#histories#`` variables.

      :param prompt_template_entity: entity holding the advanced completion template
      :param inputs: values for the template variables
      :param query: user query
      :param files: files attached to the user message
      :param context: optional context text
      :param memory: optional conversation memory
      :param model_config: model configuration
      :return: list holding the one user prompt message
      """
      completion_template = prompt_template_entity.advanced_completion_prompt_template
      raw_prompt = completion_template.prompt
      role_prefix = completion_template.role_prefix

      parser = PromptTemplateParser(template=raw_prompt)
      # Only pass the inputs the template actually references.
      prompt_inputs = {key: inputs[key] for key in parser.variable_keys if key in inputs}

      self._set_context_variable(context, parser, prompt_inputs)
      self._set_query_variable(query, parser, prompt_inputs)
      self._set_histories_variable(
          memory=memory,
          raw_prompt=raw_prompt,
          role_prefix=role_prefix,
          prompt_template=parser,
          prompt_inputs=prompt_inputs,
          model_config=model_config
      )

      prompt = self._format_prompt(parser, prompt_inputs)

      if files:
          user_content = [TextPromptMessageContent(data=prompt)]
          user_content.extend(file.prompt_message_content for file in files)
      else:
          user_content = prompt

      return [UserPromptMessage(content=user_content)]
  def _get_chat_app_chat_model_prompt_messages(self,
                                               prompt_template_entity: PromptTemplateEntity,
                                               inputs: dict,
                                               query: str,
                                               files: List[FileObj],
                                               context: Optional[str],
                                               memory: Optional[TokenBufferMemory],
                                               model_config: ModelConfigEntity) -> List[PromptMessage]:
      """
      Build the messages for a chat app on a chat model.

      Each item of the advanced chat template becomes one message of its
      role (system items are skipped when they render empty). The chat
      histories follow, then the user message with the query and any files.

      :param prompt_template_entity: entity holding the advanced chat template
      :param inputs: values for the template variables
      :param query: user query
      :param files: files attached to the user message
      :param context: optional context text
      :param memory: optional conversation memory
      :param model_config: model configuration
      :return: prompt messages
      """
      prompt_messages = []

      for prompt_item in prompt_template_entity.advanced_chat_prompt_template.messages:
          parser = PromptTemplateParser(template=prompt_item.text)
          # Only pass the inputs the template actually references.
          prompt_inputs = {key: inputs[key] for key in parser.variable_keys if key in inputs}
          self._set_context_variable(context, parser, prompt_inputs)
          prompt = self._format_prompt(parser, prompt_inputs)

          role = prompt_item.role
          if role == PromptMessageRole.SYSTEM:
              if prompt:
                  prompt_messages.append(SystemPromptMessage(content=prompt))
          elif role == PromptMessageRole.USER:
              prompt_messages.append(UserPromptMessage(content=prompt))
          elif role == PromptMessageRole.ASSISTANT:
              prompt_messages.append(AssistantPromptMessage(content=prompt))

      self._append_chat_histories(memory, prompt_messages, model_config)

      if files:
          user_content = [TextPromptMessageContent(data=query)]
          user_content.extend(file.prompt_message_content for file in files)
      else:
          user_content = query
      prompt_messages.append(UserPromptMessage(content=user_content))

      return prompt_messages
  def _get_completion_app_completion_model_prompt_messages(self,
                                                           prompt_template_entity: PromptTemplateEntity,
                                                           inputs: dict,
                                                           context: Optional[str]) -> List[PromptMessage]:
      """
      Build the single user message for a completion app on a completion model.

      The advanced completion template is rendered with the inputs plus the
      ``#context#`` variable.

      :param prompt_template_entity: entity holding the advanced completion template
      :param inputs: values for the template variables
      :param context: optional context text
      :return: list holding the one user prompt message
      """
      parser = PromptTemplateParser(
          template=prompt_template_entity.advanced_completion_prompt_template.prompt
      )
      # Only pass the inputs the template actually references.
      prompt_inputs = {key: inputs[key] for key in parser.variable_keys if key in inputs}
      self._set_context_variable(context, parser, prompt_inputs)

      return [UserPromptMessage(content=self._format_prompt(parser, prompt_inputs))]
  def _get_completion_app_chat_model_prompt_messages(self,
                                                     prompt_template_entity: PromptTemplateEntity,
                                                     inputs: dict,
                                                     files: List[FileObj],
                                                     context: Optional[str]) -> List[PromptMessage]:
      """
      Build the messages for a completion app on a chat model.

      Each item of the advanced chat template becomes one message of its
      role (system items are skipped when they render empty). When files
      are given, they are attached to the last user message.

      :param prompt_template_entity: entity holding the advanced chat template
      :param inputs: values for the template variables
      :param files: files to attach to the last user message
      :param context: optional context text
      :return: prompt messages
      """
      prompt_messages = []

      for prompt_item in prompt_template_entity.advanced_chat_prompt_template.messages:
          parser = PromptTemplateParser(template=prompt_item.text)
          # Only pass the inputs the template actually references.
          prompt_inputs = {key: inputs[key] for key in parser.variable_keys if key in inputs}
          self._set_context_variable(context, parser, prompt_inputs)
          prompt = self._format_prompt(parser, prompt_inputs)

          role = prompt_item.role
          if role == PromptMessageRole.SYSTEM:
              if prompt:
                  prompt_messages.append(SystemPromptMessage(content=prompt))
          elif role == PromptMessageRole.USER:
              prompt_messages.append(UserPromptMessage(content=prompt))
          elif role == PromptMessageRole.ASSISTANT:
              prompt_messages.append(AssistantPromptMessage(content=prompt))

      if files:
          # Only the last user message, if there is one, receives the files.
          last_user_message = next(
              (message for message in reversed(prompt_messages) if message.role == PromptMessageRole.USER),
              None
          )
          if last_user_message is not None:
              combined_content = [TextPromptMessageContent(data=last_user_message.content)]
              combined_content.extend(file.prompt_message_content for file in files)
              last_user_message.content = combined_content

      return prompt_messages