From 2660c0fa776cf3418e293242cb153a1ee4c635ce Mon Sep 17 00:00:00 2001 From: Jean-Baptiste Lespiau Date: Sun, 22 Oct 2023 07:22:22 -0700 Subject: [PATCH] Make type annotation more precise. PiperOrigin-RevId: 575613181 --- seqio/vocabularies.py | 8 ++++---- 1 file changed, 4 insertions(+), 4 deletions(-) diff --git a/seqio/vocabularies.py b/seqio/vocabularies.py index dbe1bea4..229bf9cc 100644 --- a/seqio/vocabularies.py +++ b/seqio/vocabularies.py @@ -431,7 +431,7 @@ def tf_tokenizer(self): return tf_text.SentencepieceTokenizer(model=self.sp_model) @property - def vocab_size(self): + def vocab_size(self) -> int: return self._base_vocab_size @property @@ -454,7 +454,7 @@ def _encode(self, s: str) -> Sequence[int]: """ return self.tokenizer.EncodeAsIds(s) - def _decode(self, ids): + def _decode(self, ids) -> str: """Decode a list of integers to a python string. Args: @@ -980,7 +980,7 @@ def unk_id(self) -> Optional[int]: return self._unk_id @property - def pad_id(self) -> Optional[int]: + def pad_id(self) -> int: return self._pad_id @property @@ -999,7 +999,7 @@ def tf_tokenizer(self): return self._tokenizer @property - def vocab_size(self): + def vocab_size(self) -> int: return self._base_vocab_size def _encode(self, s):