Skip to content
Open
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
8 changes: 4 additions & 4 deletions seqio/vocabularies.py
Original file line number Diff line number Diff line change
Expand Up @@ -431,7 +431,7 @@ def tf_tokenizer(self):
return tf_text.SentencepieceTokenizer(model=self.sp_model)

@property
- def vocab_size(self):
+ def vocab_size(self) -> int:
return self._base_vocab_size

@property
Expand All @@ -454,7 +454,7 @@ def _encode(self, s: str) -> Sequence[int]:
"""
return self.tokenizer.EncodeAsIds(s)

- def _decode(self, ids):
+ def _decode(self, ids) -> str:
"""Decode a list of integers to a python string.

Args:
Expand Down Expand Up @@ -980,7 +980,7 @@ def unk_id(self) -> Optional[int]:
return self._unk_id

@property
- def pad_id(self) -> Optional[int]:
+ def pad_id(self) -> int:
return self._pad_id

@property
Expand All @@ -999,7 +999,7 @@ def tf_tokenizer(self):
return self._tokenizer

@property
- def vocab_size(self):
+ def vocab_size(self) -> int:
return self._base_vocab_size

def _encode(self, s):
Expand Down