File tree: 2 files changed, +2 -2 lines changed
2 files changed, +2 -2 lines changed
Original file line number | Diff line number | Diff line change
@@ -351,4 +351,4 @@ def detokenize(self, ids):
351
351
Returns:
352
352
str: Decoded string.
353
353
"""
354
- return self .tokenizer .decode (ids , skip_special_tokens = True )
354
+ return self .tokenizer .decode (ids )
Original file line number | Diff line number | Diff line change
@@ -781,7 +781,7 @@ def load_tokenizer(self):
781
781
self .decode = lambda l : '' .join ([self .itos [i ] for i in l ])
782
782
elif 'tokenizer' in meta and meta ['tokenizer' ] == 'qwen2' :
783
783
tokenizer = AutoTokenizer .from_pretrained (meta ["qwen2_model" ], trust_remote_code = True )
784
- self .encode = lambda s : tokenizer .encode (s , add_special_tokens = False )
784
+ self .encode = lambda s : tokenizer .encode (s , add_special_tokens = True )
785
785
self .decode = lambda l : tokenizer .decode (l )
786
786
print (f"Using Qwen2 tokenizer: { meta ['qwen2_model' ]} " )
787
787
elif 'tokenizer' in meta and meta ['tokenizer' ] == 'custom_char_with_byte_fallback' :
You can’t perform that action at this time.
0 commit comments