Doc - Improve snippets testing

This commit is contained in:
Anthony MOI
2020-10-02 15:52:33 -04:00
committed by Anthony MOI
parent f4e7754112
commit 000c19a7a5
12 changed files with 84 additions and 68 deletions

View File

@@ -9,8 +9,6 @@ class TestByteLevelBPE:
tokenizer = ByteLevelBPETokenizer.from_file(roberta_files["vocab"], roberta_files["merges"])
output = tokenizer.encode("The quick brown fox jumps over the lazy dog")
tokenizer.save("roberta.json")
assert output.ids == [133, 2119, 6219, 23602, 13855, 81, 5, 22414, 2335]
assert output.tokens == [
"The",