Unverified commit bd3a9b2f, authored by takatost, committed by GitHub

fix: xinference-chat-stream-response (#991)

parent 18d38771
......@@ -123,7 +123,12 @@ class XinferenceLLM(Xinference):
if choices:
choice = choices[0]
if isinstance(choice, dict):
if 'text' in choice:
token = choice.get("text", "")
elif 'delta' in choice and 'content' in choice['delta']:
token = choice.get('delta').get('content')
else:
continue
log_probs = choice.get("logprobs")
if run_manager:
run_manager.on_llm_new_token(
......
Markdown is supported
0% or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment