Generate pyi, fix tests and clippy warnings
@@ -83,6 +83,27 @@ class UnigramTrainer(Trainer):
     def __init__(self, vocab_size=8000, show_progress=True, special_tokens=[]):
         pass
 
+class WordLevelTrainer(Trainer):
+    """
+    Capable of training a WordLevel model
+
+    Args:
+        vocab_size: unsigned int:
+            The size of the final vocabulary, including all tokens and alphabet.
+
+        min_frequency: unsigned int:
+            The minimum frequency a token should have in order to be kept in the vocabulary.
+
+        show_progress: boolean:
+            Whether to show progress bars while training.
+
+        special_tokens: List[Union[str, AddedToken]]:
+            A list of special tokens the model should know of.
+
+    Returns:
+        Trainer
+    """
+
 class WordPieceTrainer(Trainer):
     """
     Capable of training a WordPiece model
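For context, a minimal usage sketch of the WordLevelTrainer documented above, assuming the standard `tokenizers` Python API (Tokenizer, WordLevel, Whitespace). The corpus file name and the particular special tokens are illustrative assumptions, not part of this commit.

# Minimal sketch: train a WordLevel model with the trainer stubbed above.
# Assumes the `tokenizers` package; "corpus.txt" is a hypothetical file.
from tokenizers import Tokenizer
from tokenizers.models import WordLevel
from tokenizers.pre_tokenizers import Whitespace
from tokenizers.trainers import WordLevelTrainer

# WordLevel maps whole words to ids; there is no subword merging.
tokenizer = Tokenizer(WordLevel(unk_token="[UNK]"))
tokenizer.pre_tokenizer = Whitespace()

trainer = WordLevelTrainer(
    vocab_size=8000,                    # size of the final vocabulary
    min_frequency=2,                    # drop words seen fewer than 2 times
    show_progress=True,
    special_tokens=["[UNK]", "[PAD]"],  # tokens the model should know of
)

# Train from one or more plain-text files, then encode a sample.
tokenizer.train(["corpus.txt"], trainer=trainer)
print(tokenizer.encode("hello world").tokens)

Because WordLevel performs no merging, min_frequency here simply filters rare words out of the vocabulary rather than gating merge operations.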