Upload bert_tokenizer.py
Browse files- bert_tokenizer.py +2 -2
bert_tokenizer.py
CHANGED
@@ -135,9 +135,9 @@ class ChineseBertTokenizer(BertTokenizerFast):
|
|
135 |
pinyin_ids = torch.LongTensor(pinyin_tokens).view(-1)
|
136 |
return input_ids, pinyin_ids
|
137 |
|
138 |
-
def convert_ids_to_pinyin_ids(self, ids: List[
|
139 |
pinyin_ids = []
|
140 |
-
tokens = self.
|
141 |
for token in tokens:
|
142 |
if len(token) > 1:
|
143 |
pinyin_ids.append([0] * 8)
|
|
|
135 |
pinyin_ids = torch.LongTensor(pinyin_tokens).view(-1)
|
136 |
return input_ids, pinyin_ids
|
137 |
|
138 |
+
def convert_ids_to_pinyin_ids(self, ids: List[int]):
|
139 |
pinyin_ids = []
|
140 |
+
tokens = self.convert_ids_to_tokens(ids)
|
141 |
for token in tokens:
|
142 |
if len(token) > 1:
|
143 |
pinyin_ids.append([0] * 8)
|