mirror of
https://github.com/mii443/tokenizers.git
synced 2025-08-22 16:25:30 +00:00
Fix stride condition. (#1321)
* Release all at once for simplicity.
* rc2
This commit is contained in:
@ -1,4 +1,4 @@
|
||||
__version__ = "0.13.4.rc1"
|
||||
__version__ = "0.13.4.rc2"
|
||||
|
||||
from enum import Enum
|
||||
from typing import List, Tuple, Union
|
||||
|
@ -9,7 +9,7 @@ extras["dev"] = extras["testing"]
|
||||
|
||||
setup(
|
||||
name="tokenizers",
|
||||
version="0.13.4.rc1",
|
||||
version="0.13.4.rc2",
|
||||
description="Fast and Customizable Tokenizers",
|
||||
long_description=open("README.md", "r", encoding="utf-8").read(),
|
||||
long_description_content_type="text/markdown",
|
||||
|
@ -605,7 +605,7 @@ where
|
||||
if let Some(trunc_params) = &trunc {
|
||||
let n_added_tokens = self.get_n_added_tokens(false);
|
||||
let effective_max_length = trunc_params.max_length - n_added_tokens;
|
||||
if effective_max_length <= trunc_params.stride {
|
||||
if effective_max_length < trunc_params.stride {
|
||||
return Err(Box::new(TruncationParamError(format!(
|
||||
"tokenizer stride set to {}, which is greater than or equal to its effective max length of {} (= {} original max length - {} added special tokens), ",
|
||||
trunc_params.stride, effective_max_length, trunc_params.max_length, n_added_tokens
|
||||
|
Reference in New Issue
Block a user