We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
2 parents 054c196 + 4ec593d · commit 236c791 · Copy full SHA for 236c791
megatron/inference/text_generation/tokenization.py
@@ -35,6 +35,8 @@ def detokenize_generations(tokens_gpu_tensor,
35
'HuggingFaceTokenizer',
36
'Llama2Tokenizer']:
37
word = tokenizer.decoder[token]
38
+ elif args.tokenizer_type == 'TikTokenizer':
39
+ word = tokenizer.detokenize([token])
40
elif args.tokenizer_type in ['Llama3Tokenizer', 'MistralTokenizer']:
41
word = tokenizer.decode([token])
42
elif args.tokenizer_type == 'NullTokenizer':
0 commit comments