pub struct EsmSequenceTokenizer { /* private fields */ }
Implementations§
Source§impl EsmSequenceTokenizer
impl EsmSequenceTokenizer
Source pub fn tokenize_sequence(
&self,
sequence: &str,
add_special_tokens: bool,
) -> Vec<u32>
pub fn tokenize_sequence( &self, sequence: &str, add_special_tokens: bool, ) -> Vec<u32>
Tokenize an amino-acid sequence string into token IDs.
Looks up each character in SEQUENCE_VOCAB. Unknown characters map to
the <unk> token (index 3). When add_special_tokens is true, prepends
BOS (<cls> = 0) and appends EOS (<eos> = 2).
Source pub fn decode_sequence(&self, token_ids: &[u32]) -> String
pub fn decode_sequence(&self, token_ids: &[u32]) -> String
Decode token IDs back to an amino-acid sequence string.
Skips the standard special tokens (BOS=0, PAD=1, EOS=2, MASK=32) and concatenates the remaining vocabulary entries.
Trait Implementations§
Source§impl Default for EsmSequenceTokenizer
impl Default for EsmSequenceTokenizer
Source§impl EsmTokenizerBase for EsmSequenceTokenizer
impl EsmTokenizerBase for EsmSequenceTokenizer
fn encode(&self) -> Result<()>
fn decode(&self) -> Result<()>
fn mask_token(&self) -> &str
fn mask_token_id(&self) -> u32
fn bos_token(&self) -> &str
fn bos_token_id(&self) -> u32
fn eos_token(&self) -> &str
fn eos_token_id(&self) -> u32
fn pad_token(&self) -> &str
fn pad_token_id(&self) -> u32
fn chain_break_token(&self) -> &str
fn chain_break_token_id(&self) -> u32
fn all_token_ids(&self) -> Vec<u32>
fn special_token_ids(&self) -> Vec<u32>
Auto Trait Implementations§
impl Freeze for EsmSequenceTokenizer
impl RefUnwindSafe for EsmSequenceTokenizer
impl Send for EsmSequenceTokenizer
impl Sync for EsmSequenceTokenizer
impl Unpin for EsmSequenceTokenizer
impl UnsafeUnpin for EsmSequenceTokenizer
impl UnwindSafe for EsmSequenceTokenizer
Blanket Implementations§
Source§impl<T> BorrowMut<T> for T where
T: ?Sized,
impl<T> BorrowMut<T> for T where
T: ?Sized,
Source§fn borrow_mut(&mut self) -> &mut T
fn borrow_mut(&mut self) -> &mut T
Mutably borrows from an owned value. Read more
§impl<T> Instrument for T
impl<T> Instrument for T
§fn instrument(self, span: Span) -> Instrumented<Self>
fn instrument(self, span: Span) -> Instrumented<Self>
§fn in_current_span(self) -> Instrumented<Self>
fn in_current_span(self) -> Instrumented<Self>
Source§impl<T> IntoEither for T
impl<T> IntoEither for T
Source§fn into_either(self, into_left: bool) -> Either<Self, Self>
fn into_either(self, into_left: bool) -> Either<Self, Self>
Converts self into a Left variant of Either<Self, Self> if into_left is true.
Converts self into a Right variant of Either<Self, Self> otherwise. Read more
Source§fn into_either_with<F>(self, into_left: F) -> Either<Self, Self>
fn into_either_with<F>(self, into_left: F) -> Either<Self, Self>
Converts self into a Left variant of Either<Self, Self> if into_left(&self) returns true.
Converts self into a Right variant of Either<Self, Self> otherwise. Read more