# M3Site/esm/tokenization/tokenizer_base.py
# Uploaded by anonymousforpaper ("Upload 103 files"), commit 224a33f (verified), 691 bytes.
from typing import Protocol, runtime_checkable
@runtime_checkable
class EsmTokenizerBase(Protocol):
    """Structural interface describing a tokenizer.

    Any object that exposes ``encode`` and ``decode`` plus the string form and
    integer id of the mask, BOS, EOS and pad tokens satisfies this protocol;
    no inheritance is required.

    The class is ``@runtime_checkable``, so ``isinstance(obj, EsmTokenizerBase)``
    works at runtime. That check only verifies that every member listed here
    is present on the object; it does not validate signatures or return types.
    """

    def encode(self, *args, **kwargs):
        """Encode input; arguments and return type are left to the implementation."""
        ...

    def decode(self, *args, **kwargs):
        """Decode input; arguments and return type are left to the implementation."""
        ...

    @property
    def mask_token(self) -> str:
        """String form of the mask token."""
        ...

    @property
    def mask_token_id(self) -> int:
        """Integer id of the mask token."""
        ...

    @property
    def bos_token(self) -> str:
        """String form of the BOS token."""
        ...

    @property
    def bos_token_id(self) -> int:
        """Integer id of the BOS token."""
        ...

    @property
    def eos_token(self) -> str:
        """String form of the EOS token."""
        ...

    @property
    def eos_token_id(self) -> int:
        """Integer id of the EOS token."""
        ...

    @property
    def pad_token(self) -> str:
        """String form of the pad token."""
        ...

    @property
    def pad_token_id(self) -> int:
        """Integer id of the pad token."""
        ...