import json
class Tokenizer:
    """Two-way lookup between words and integer ids, loaded from JSON files.

    Attributes:
        word2int: Mapping loaded verbatim from ``word2int_path``; keys are
            the JSON object's string keys (values are presumably integer
            ids -- they are not validated here).
        int2word: Mapping loaded from ``int2word_path`` with every key
            converted to ``int``.
    """

    def __init__(self, word2int_path, int2word_path):
        """Load both vocabularies from disk.

        Args:
            word2int_path: Path to a JSON object used for ``encode`` lookups.
            int2word_path: Path to a JSON object used for ``decode`` lookups.
                Its keys must be strings that ``int()`` can parse.

        Raises:
            OSError: If either file cannot be opened.
            json.JSONDecodeError: If either file is not valid JSON.
            ValueError: If a key in the second file is not an integer string.
        """
        # Decode explicitly as UTF-8 rather than relying on the platform's
        # locale encoding, so vocabularies containing non-ASCII tokens load
        # identically on every system.
        with open(word2int_path, 'r', encoding='utf-8') as f:
            self.word2int = json.load(f)
        with open(int2word_path, 'r', encoding='utf-8') as f:
            # JSON object keys are always strings; convert them back to ints
            # so decode() can be called with integer ids.
            self.int2word = {int(k): v for k, v in json.load(f).items()}

    def encode(self, word):
        """Return the entry stored for ``word`` in ``word2int``.

        Raises:
            KeyError: If ``word`` is not in the vocabulary.
        """
        return self.word2int[word]

    def decode(self, int_val):
        """Return the entry stored for ``int_val`` in ``int2word``.

        Raises:
            KeyError: If ``int_val`` is not in the vocabulary.
        """
        return self.int2word[int_val]