We read every piece of feedback and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
stream=True
1 parent 3687262 commit 0756a2d (Copy full SHA for 0756a2d)
llama_cpp/llama.py
@@ -953,7 +953,7 @@ def _create_completion(
953
token_end_position += len(self.detokenize([token]))
954
# Check if stop sequence is in the token
955
if token_end_position >= (
956
- remaining_length - first_stop_position - 1
+ remaining_length - first_stop_position
957
):
958
break
959
logprobs_or_none: Optional[CompletionLogprobs] = None
0 commit comments