iioSnail committed on
Commit
78daf2e
·
1 Parent(s): d292447

Upload bert_tokenizer.py

Browse files
Files changed (1) hide show
  1. bert_tokenizer.py +2 -2
bert_tokenizer.py CHANGED
@@ -135,9 +135,9 @@ class ChineseBertTokenizer(BertTokenizerFast):
135
  pinyin_ids = torch.LongTensor(pinyin_tokens).view(-1)
136
  return input_ids, pinyin_ids
137
 
138
- def convert_ids_to_pinyin_ids(self, ids: List[str]):
139
  pinyin_ids = []
140
- tokens = self.convert_tokens_to_ids(ids)
141
  for token in tokens:
142
  if len(token) > 1:
143
  pinyin_ids.append([0] * 8)
 
135
  pinyin_ids = torch.LongTensor(pinyin_tokens).view(-1)
136
  return input_ids, pinyin_ids
137
 
138
+ def convert_ids_to_pinyin_ids(self, ids: List[int]):
139
  pinyin_ids = []
140
+ tokens = self.convert_ids_to_tokens(ids)
141
  for token in tokens:
142
  if len(token) > 1:
143
  pinyin_ids.append([0] * 8)