We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
1 parent 043e7c4 commit 4be8a07 (Copy full SHA for 4be8a07)
src/deepsparse/transformers/pipelines/text_generation.py
@@ -834,7 +834,7 @@ def engine_forward(
834
generated_tokens.append(token)
835
generated_logits.append(logits)
836
837
- if session.total_num_processed_tokens >= session.capacity:
+ if session.total_num_processed_tokens > session.capacity:
838
# if the kv cache is full, stop generation
839
finished_reason.append(FinishReason.CAPACITY)
840
break
0 commit comments