Unverified commit 2f7b234c authored by takatost, committed by GitHub

fix: handle missing max_tokens when calculating rest tokens in generate summary (#891)

parent 4f5f9506
@@ -51,6 +51,7 @@ class LLMGenerator:
         prompt_with_empty_context = prompt.format(context='')
         prompt_tokens = model_instance.get_num_tokens([PromptMessage(content=prompt_with_empty_context)])
         max_context_token_length = model_instance.model_rules.max_tokens.max
+        max_context_token_length = max_context_token_length if max_context_token_length else 1500
         rest_tokens = max_context_token_length - prompt_tokens - max_tokens - 1
         context = ''
...
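
The one-line change guards against model rules that leave `max_tokens.max` unset: subtracting prompt and completion tokens from `None` would raise a `TypeError`, so the patch falls back to a default budget of 1500 tokens before computing the remaining context budget. Below is a minimal sketch of the same logic; the `TokenRule` dataclass and `calc_rest_tokens` helper are illustrative stand-ins, not Dify's actual `model_instance` / `model_rules` API.

```python
# Sketch of the guarded rest-token calculation, with hypothetical stand-in
# types in place of the project's model classes.

from dataclasses import dataclass
from typing import Optional


@dataclass
class TokenRule:
    # Some providers do not declare an upper bound, so max may be None.
    max: Optional[int] = None


def calc_rest_tokens(prompt_tokens: int, max_tokens: int, rule: TokenRule) -> int:
    """Return the token budget left for context after prompt and completion."""
    max_context_token_length = rule.max
    # The fix: fall back to a conservative default when the rule does not
    # specify a maximum, instead of subtracting from None.
    max_context_token_length = max_context_token_length if max_context_token_length else 1500
    return max_context_token_length - prompt_tokens - max_tokens - 1


if __name__ == "__main__":
    # Before the fix, a rule with max=None raised:
    #   TypeError: unsupported operand type(s) for -: 'NoneType' and 'int'
    print(calc_rest_tokens(prompt_tokens=200, max_tokens=256, rule=TokenRule()))      # 1043
    print(calc_rest_tokens(prompt_tokens=200, max_tokens=256, rule=TokenRule(4096)))  # 3639
```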