mirror of
https://github.com/mii443/tokenizers.git
synced 2025-08-22 16:25:30 +00:00
Wrap rustdoc html entity in code block (#1130)
This commit is contained in:
@ -14,7 +14,7 @@ use serde::{Deserialize, Serialize};
|
|||||||
pub struct CTC {
|
pub struct CTC {
|
||||||
/// The pad token used by CTC to delimit a new token.
|
/// The pad token used by CTC to delimit a new token.
|
||||||
pub pad_token: String,
|
pub pad_token: String,
|
||||||
/// The word delimiter token. It will be replaced by a <space>
|
/// The word delimiter token. It will be replaced by a `<space>`.
|
||||||
pub word_delimiter_token: String,
|
pub word_delimiter_token: String,
|
||||||
/// Whether to cleanup some tokenization artifacts.
|
/// Whether to cleanup some tokenization artifacts.
|
||||||
/// Mainly spaces before punctuation, and some abbreviated english forms.
|
/// Mainly spaces before punctuation, and some abbreviated english forms.
|
||||||
|
Reference in New Issue
Block a user