File tree: 1 file changed (+5 -1 lines changed)
1 file changed +5
-1
lines changed Original file line number Diff line number Diff line change 2
2
from abc import ABC , abstractmethod
3
3
from typing import Optional
4
4
5
+ import tokenizers
6
+ from packaging import version
5
7
from tokenizers import Tokenizer
6
8
from tokenizers .decoders import DecodeStream
7
9
from transformers import PreTrainedTokenizerFast
@@ -43,8 +45,10 @@ def from_new_request(
43
45
# No tokenizer => skipping detokenization.
44
46
return IncrementalDetokenizer ()
45
47
46
- if isinstance (tokenizer , PreTrainedTokenizerFast ):
48
+ if (isinstance (tokenizer , PreTrainedTokenizerFast ) and version .parse (
49
+ tokenizers .__version__ ) >= version .parse ("0.21.1" )):
47
50
# Fast tokenizer => use tokenizers library DecodeStream.
51
+ # Only tokenizers >= 0.21.1 supports the fast detokenizer.
48
52
return FastIncrementalDetokenizer (tokenizer , request )
49
53
50
54
# Fall back to slow python-based incremental detokenization.
You can’t perform that action at this time.
0 commit comments