We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
1 parent 89164cb commit b17af98 Copy full SHA for b17af98
src/deepsparse/v2/text_generation/prep_for_single_engine.py
@@ -39,7 +39,7 @@ def can_operate(self, inp: Any, context: Context, inference_state: InferenceStat
39
kv_cache = inp.get("kv_cache")
40
tokens = inp.get("tokens")
41
# if 0 prompt tokens remain, can't operate (multi-token engine has already run)
42
- if len(tokens) == kv_cache.total_num_processed_tokens == 0:
+ if len(tokens) == kv_cache.total_num_processed_tokens:
43
return False
44
45
# if number of prompt tokens left to process is >= self.prompt_sequence_length
0 commit comments