Python - Test CharBPETokenizer

This commit is contained in:
Anthony MOI
2020-04-01 15:12:34 -04:00
parent dbc23e20a9
commit 7fd7dfd113
2 changed files with 56 additions and 0 deletions

View File

@@ -44,3 +44,15 @@ def bert_files(data_dir):
"https://s3.amazonaws.com/models.huggingface.co/bert/bert-base-uncased-vocab.txt"
),
}
@pytest.fixture(scope="session")
def openai_files(data_dir):
    """Fetch the OpenAI GPT vocabulary and merges files for the test session.

    Each file is obtained by passing its URL to ``download``; whatever that
    helper returns is stored in the resulting mapping.

    Args:
        data_dir: Fixture dependency. It is not read in this body; presumably
            it is requested so the data directory is prepared before any
            download happens -- confirm against the ``data_dir`` fixture.

    Returns:
        A dict with two entries: ``"vocab"`` (result of downloading
        ``openai-gpt-vocab.json``) and ``"merges"`` (result of downloading
        ``openai-gpt-merges.txt``).
    """
    # Vocabulary first, then merges: same call order as the dict keys below.
    vocab_result = download(
        "https://s3.amazonaws.com/models.huggingface.co/bert/openai-gpt-vocab.json"
    )
    merges_result = download(
        "https://s3.amazonaws.com/models.huggingface.co/bert/openai-gpt-merges.txt"
    )
    return {"vocab": vocab_result, "merges": merges_result}