[MINOR:TYPO] Fix docstrings (#1653)

* [MINOR:TYPO] Update pre_tokenizers.rs

* [MINOR:TYPO] Update __init__.pyi
Christopher Akiki
2024-11-05 16:25:06 +01:00
committed by GitHub
parent 5e223ceb48
commit 57884ebaa2
2 changed files with 2 additions and 2 deletions

__init__.pyi

@@ -421,7 +421,7 @@ class Split(PreTokenizer):
     Args:
         pattern (:obj:`str` or :class:`~tokenizers.Regex`):
-            A pattern used to split the string. Usually a string or a a regex built with `tokenizers.Regex`.
+            A pattern used to split the string. Usually a string or a regex built with `tokenizers.Regex`.
             If you want to use a regex pattern, it has to be wrapped around a `tokenizer.Regex`,
             otherwise we consider is as a string pattern. For example `pattern="|"`
             means you want to split on `|` (imagine a csv file for example), while

pre_tokenizers.rs

@@ -334,7 +334,7 @@ impl PyWhitespaceSplit {
 ///
 /// Args:
 ///     pattern (:obj:`str` or :class:`~tokenizers.Regex`):
-///         A pattern used to split the string. Usually a string or a a regex built with `tokenizers.Regex`.
+///         A pattern used to split the string. Usually a string or a regex built with `tokenizers.Regex`.
 ///     If you want to use a regex pattern, it has to be wrapped around a `tokenizer.Regex`,
 ///     otherwise we consider is as a string pattern. For example `pattern="|"`
 ///     means you want to split on `|` (imagine a csv file for example), while
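The docstring being corrected describes how `Split` interprets its `pattern` argument: a plain string is treated as a literal pattern, while real regex matching requires wrapping the pattern in `tokenizers.Regex`. A minimal stdlib-only sketch of that distinction (the `split_like` helper is hypothetical, for illustration only, and is not part of the tokenizers API):

```python
import re

def split_like(text, pattern, is_regex=False):
    # Mirrors the documented behavior: a plain string is a literal
    # delimiter (e.g. "|" splits on the pipe character, as in a csv
    # line), while a pattern flagged as a regex is compiled and
    # matched as a real regular expression.
    if is_regex:
        return re.split(pattern, text)
    return text.split(pattern)

# Literal split: "|" means the pipe character itself, not regex alternation.
print(split_like("a|b|c", "|"))  # ['a', 'b', 'c']
# Regex split: "\d+" splits on runs of digits.
print(split_like("a1b22c", r"\d+", is_regex=True))
```

In the actual library the same switch is made by the pattern's type rather than a flag: `Split("|", behavior="removed")` splits on the literal pipe, whereas passing `tokenizers.Regex("|")` would treat it as a regex.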