Unverified Commit 4f3053a8 authored by takatost, committed by GitHub

fix: xinference chat completion error (#952)

parent b3c2bf12
...@@ -46,7 +46,7 @@ class XinferenceLLM(Xinference):
                 return combined_text_output
             else:
                 completion = model.chat(prompt=prompt, generate_config=generate_config)
-                return completion["choices"][0]["text"]
+                return completion["choices"][0]["message"]["content"]
         elif isinstance(model, RESTfulGenerateModelHandle):
             generate_config: "LlamaCppGenerateConfig" = kwargs.get("generate_config", {})
...@@ -82,7 +82,7 @@ class XinferenceLLM(Xinference):
                 completion = combined_text_output
             else:
                 completion = model.chat(prompt=prompt, generate_config=generate_config)
-                completion = completion["choices"][0]["text"]
+                completion = completion["choices"][0]["message"]["content"]
             if stop is not None:
                 completion = enforce_stop_tokens(completion, stop)
......
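For context, a minimal sketch of why the key path changes: Xinference follows OpenAI-style response schemas, where generate() returns completion-style choices with a top-level "text" field, while chat() returns chat-style choices whose text is nested under message.content. The payloads below are illustrative assumptions, not taken from this commit.

# Illustrative sketch (hypothetical payloads, not from this commit) of the
# two OpenAI-style response shapes behind the one-line fix above.

# model.generate(...) returns a completion-style payload:
generate_response = {
    "choices": [
        {"index": 0, "text": "Hello!", "finish_reason": "stop"},
    ]
}

# model.chat(...) returns a chat-style payload; the text lives under
# message.content rather than a top-level "text" key:
chat_response = {
    "choices": [
        {
            "index": 0,
            "message": {"role": "assistant", "content": "Hello!"},
            "finish_reason": "stop",
        },
    ]
}

# The old code read the completion-style path from a chat response and
# raised a KeyError; the fix reads the chat-style path instead:
assert chat_response["choices"][0]["message"]["content"] == "Hello!"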