fix: fall back to a default when the model's max tokens limit does not exist while calculating rest tokens in generate summary (#891)
This commit is contained in:
@@ -51,6 +51,7 @@ class LLMGenerator:
|
|||||||
prompt_with_empty_context = prompt.format(context='')
|
prompt_with_empty_context = prompt.format(context='')
|
||||||
prompt_tokens = model_instance.get_num_tokens([PromptMessage(content=prompt_with_empty_context)])
|
prompt_tokens = model_instance.get_num_tokens([PromptMessage(content=prompt_with_empty_context)])
|
||||||
max_context_token_length = model_instance.model_rules.max_tokens.max
|
max_context_token_length = model_instance.model_rules.max_tokens.max
|
||||||
|
max_context_token_length = max_context_token_length if max_context_token_length else 1500
|
||||||
rest_tokens = max_context_token_length - prompt_tokens - max_tokens - 1
|
rest_tokens = max_context_token_length - prompt_tokens - max_tokens - 1
|
||||||
|
|
||||||
context = ''
|
context = ''
|
||||||
|
Reference in New Issue
Block a user