xu song
committed on
Commit
·
34f1177
1
Parent(s):
d8e1d2b
update
Browse files
- models/cpp_qwen2.py +5 -2
models/cpp_qwen2.py
CHANGED
@@ -134,12 +134,15 @@ class Qwen2Simulator(Simulator):
|
|
134 |
def tokenize(self, text):
|
135 |
return self.llm.tokenize(text.encode("utf-8"))
|
136 |
|
|
|
|
|
|
|
137 |
def strip_stoptokens(self, tokens):
|
138 |
while tokens and tokens[0] in self.stop_tokens:
|
139 |
-
logger.info(f"striping {tokens[0]}")
|
140 |
tokens.pop(0)
|
141 |
while tokens and tokens[-1] in self.stop_tokens:
|
142 |
-
logger.info(f"striping {tokens[-1]}")
|
143 |
tokens.pop()
|
144 |
return tokens
|
145 |
|
|
|
134 |
def tokenize(self, text):
|
135 |
return self.llm.tokenize(text.encode("utf-8"))
|
136 |
|
137 |
+
def detokenize(self, tokens):
|
138 |
+
return self.llm.detokenize(tokens).decode("utf-8")
|
139 |
+
|
140 |
def strip_stoptokens(self, tokens):
|
141 |
while tokens and tokens[0] in self.stop_tokens:
|
142 |
+
logger.info(f"head-striping {tokens[0]} {self.llm.detokenize([tokens[0]])}")
|
143 |
tokens.pop(0)
|
144 |
while tokens and tokens[-1] in self.stop_tokens:
|
145 |
+
logger.info(f"tail-striping {tokens[-1]} {self.llm.detokenize([tokens[-1]])}")
|
146 |
tokens.pop()
|
147 |
return tokens
|
148 |
|