PrajwalS committed on
Commit
768b288
·
1 Parent(s): 060414e

add tokenizer

Browse files
Files changed (2) hide show
  1. .gitignore +1 -0
  2. vocab.json +1 -1
.gitignore ADDED
@@ -0,0 +1 @@
 
 
1
+ checkpoint-*/
vocab.json CHANGED
@@ -1 +1 @@
1
- {"r": 0, "y": 1, "v": 2, "l": 3, "o": 4, "h": 5, "g": 6, "'": 7, "b": 8, "w": 9, "i": 10, "s": 11, "t": 12, "c": 13, "a": 14, "e": 15, "z": 16, "u": 17, "q": 18, "f": 19, "x": 20, "m": 21, "n": 23, "j": 24, "k": 25, "d": 26, "p": 27, "|": 22, "[UNK]": 28, "[PAD]": 29}
 
1
+ {"e": 0, "g": 1, "w": 2, "o": 3, "b": 4, "r": 5, "t": 6, "a": 7, "n": 8, "q": 9, "u": 10, "i": 11, "p": 12, "k": 13, "f": 14, "m": 15, "c": 16, "y": 17, "l": 18, "h": 19, "d": 21, "x": 22, "j": 23, "s": 24, "z": 25, "v": 26, "'": 27, "|": 20, "[UNK]": 28, "[PAD]": 29}