Now the last token is sent when stream=True

This commit is contained in:
Carlos Tejada 2023-07-19 22:47:14 -04:00
parent 36872620d0
commit 0756a2d3fb

View file

@@ -953,7 +953,7 @@ class Llama:
token_end_position += len(self.detokenize([token]))
# Check if stop sequence is in the token
if token_end_position >= (
- remaining_length - first_stop_position - 1
+ remaining_length - first_stop_position
):
break
logprobs_or_none: Optional[CompletionLogprobs] = None