mirror of
https://github.com/mii443/tokenizers.git
synced 2025-08-23 00:35:35 +00:00
Python - Expose ByteLevel alphabet
This commit is contained in:
@@ -50,6 +50,14 @@ impl ByteLevel {
             ))),
         })
     }
+
+    #[staticmethod]
+    fn alphabet() -> Vec<String> {
+        tk::pre_tokenizers::byte_level::ByteLevel::alphabet()
+            .into_iter()
+            .map(|c| c.to_string())
+            .collect()
+    }
 }
 
 #[pyclass]
Reference in New Issue
Block a user