mirror of
https://github.com/mii443/tokenizers.git
synced 2025-12-07 13:18:31 +00:00
Fix typo in Python binding README
Trailing paren causes an error
This commit is contained in:
@@ -158,7 +158,7 @@ tokenizer = Tokenizer(models.BPE.empty())
|
|||||||
|
|
||||||
# Customize pre-tokenization and decoding
|
# Customize pre-tokenization and decoding
|
||||||
tokenizer.pre_tokenizer = pre_tokenizers.ByteLevel.new(add_prefix_space=True)
|
tokenizer.pre_tokenizer = pre_tokenizers.ByteLevel.new(add_prefix_space=True)
|
||||||
tokenizer.decoder = decoders.ByteLevel.new())
|
tokenizer.decoder = decoders.ByteLevel.new()
|
||||||
|
|
||||||
# And then train
|
# And then train
|
||||||
trainer = trainers.BpeTrainer.new(vocab_size=20000, min_frequency=2)
|
trainer = trainers.BpeTrainer.new(vocab_size=20000, min_frequency=2)
|
||||||
|
|||||||
Reference in New Issue
Block a user