Use a smaller train file.

This commit is contained in:
Nicolas Patry
2020-09-02 15:07:39 +02:00
committed by Anthony MOI
parent 7acbb1122e
commit d0366529b7
2 changed files with 4 additions and 1 deletion

View File

@@ -65,6 +65,9 @@ def train_files(data_dir):
"wagahaiwa": download(
"https://storage.googleapis.com/tokenizers/unigram_wagahaiwa_nekodearu.txt"
),
"simple": download(
"https://s3.amazonaws.com/models.huggingface.co/bert/roberta-base-merges.txt"
),
}