mirror of
https://github.com/mii443/tokenizers.git
synced 2025-12-04 03:38:23 +00:00
Python - Add bindings for some Model methods
This commit is contained in:
@@ -2,6 +2,7 @@ use std::collections::HashMap;
|
||||
use std::path::{Path, PathBuf};
|
||||
use std::sync::Arc;
|
||||
|
||||
use crate::token::PyToken;
|
||||
use pyo3::exceptions;
|
||||
use pyo3::prelude::*;
|
||||
use pyo3::types::*;
|
||||
@@ -105,6 +106,22 @@ impl PyModel {
|
||||
}
|
||||
}
|
||||
|
||||
fn tokenize(&self, tokens: &str) -> PyResult<Vec<PyToken>> {
|
||||
Ok(ToPyResult(self.model.tokenize(tokens))
|
||||
.into_py()?
|
||||
.into_iter()
|
||||
.map(|t| t.into())
|
||||
.collect())
|
||||
}
|
||||
|
||||
fn token_to_id(&self, token: &str) -> Option<u32> {
|
||||
self.model.token_to_id(token)
|
||||
}
|
||||
|
||||
fn id_to_token(&self, id: u32) -> Option<&str> {
|
||||
self.model.id_to_token(id)
|
||||
}
|
||||
|
||||
fn save(&self, folder: &str, name: Option<&str>) -> PyResult<Vec<String>> {
|
||||
let saved: PyResult<Vec<_>> = ToPyResult(self.model.save(Path::new(folder), name)).into();
|
||||
|
||||
|
||||
Reference in New Issue
Block a user