(self, text)
| 170 | self.wordpiece_tokenizer = WordpieceTokenizer(vocab=self.vocab) |
| 171 | |
def tokenize(self, text):
    """Split *text* into sub-tokens using both tokenizers in sequence.

    ``self.basic_tokenizer.tokenize(text)`` is run first; each token it
    yields is then passed to ``self.wordpiece_tokenizer.tokenize``.

    Args:
        text: Input handed unchanged to the basic tokenizer.

    Returns:
        A flat list of every sub-token, in the order produced.
    """
    basic = self.basic_tokenizer
    wordpiece = self.wordpiece_tokenizer
    # Flatten the per-token pieces into a single list, preserving order.
    return [
        piece
        for word in basic.tokenize(text)
        for piece in wordpiece.tokenize(word)
    ]
| 179 | |
def convert_tokens_to_ids(self, tokens):
    """Look up *tokens* in this tokenizer's vocabulary.

    Delegates to ``convert_by_vocab`` with ``self.vocab`` and returns its
    result unchanged (presumably a list of ids -- confirm against
    ``convert_by_vocab``).

    Args:
        tokens: Tokens to convert, passed straight to ``convert_by_vocab``.
    """
    vocab = self.vocab
    return convert_by_vocab(vocab, tokens)
no outgoing calls
no test coverage detected