Prechádzať zdrojové kódy

fix: xinference-chat-stream-response (#991)

takatost 1 rok pred
rodič
commit
bd3a9b2f8d

+ 6 - 1
api/core/third_party/langchain/llms/xinference_llm.py

@@ -123,7 +123,12 @@ class XinferenceLLM(Xinference):
                 if choices:
                     choice = choices[0]
                     if isinstance(choice, dict):
-                        token = choice.get("text", "")
+                        if 'text' in choice:
+                            token = choice.get("text", "")
+                        elif 'delta' in choice and 'content' in choice['delta']:
+                            token = choice.get('delta').get('content')
+                        else:
+                            continue
                         log_probs = choice.get("logprobs")
                         if run_manager:
                             run_manager.on_llm_new_token(