xzuyn committed on
Commit
d449931
·
verified ·
1 Parent(s): 37f3323

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +3 -3
app.py CHANGED
@@ -18,7 +18,7 @@ def tokenize(input_text):
18
  codeqwen_tokens = len(codeqwen_tokenizer(input_text, add_special_tokens=True)["input_ids"])
19
  rwkv4_tokens = len(rwkv4_tokenizer(input_text, add_special_tokens=True)["input_ids"])
20
  rwkv5_tokens = len(rwkv5_tokenizer(input_text, add_special_tokens=True)["input_ids"])
21
- deepseek_tokens = len(deepseek_tokenizer(input_text, add_special_tokens=True)["input_ids"])
22
  internlm_tokens = len(internlm_tokenizer(input_text, add_special_tokens=True)["input_ids"])
23
  internlm2_tokens = len(internlm2_tokenizer(input_text, add_special_tokens=True)["input_ids"])
24
 
@@ -38,7 +38,7 @@ def tokenize(input_text):
38
  "CodeQwen": codeqwen_tokens,
39
  "RWKV-v4": rwkv4_tokens,
40
  "RWKV-v5/RWKV-v6": rwkv5_tokens,
41
- "DeepSeek-LLM/DeepSeek-V2": deepseek_tokens,
42
  "InternLM": internlm_tokens,
43
  "InternLM2": internlm2_tokens
44
  }
@@ -65,7 +65,7 @@ if __name__ == "__main__":
65
  codeqwen_tokenizer = AutoTokenizer.from_pretrained("Qwen/CodeQwen1.5-7B")
66
  rwkv4_tokenizer = AutoTokenizer.from_pretrained("RWKV/rwkv-4-14b-pile", trust_remote_code=True)
67
  rwkv5_tokenizer = AutoTokenizer.from_pretrained("RWKV/v5-EagleX-v2-7B-HF", trust_remote_code=True)
68
- deepseek_tokenizer = AutoTokenizer.from_pretrained("deepseek-ai/DeepSeek-V2", trust_remote_code=True)
69
  internlm_tokenizer = AutoTokenizer.from_pretrained("internlm/internlm-20b", trust_remote_code=True)
70
  internlm2_tokenizer = AutoTokenizer.from_pretrained("internlm/internlm2-20b", trust_remote_code=True)
71
 
 
18
  codeqwen_tokens = len(codeqwen_tokenizer(input_text, add_special_tokens=True)["input_ids"])
19
  rwkv4_tokens = len(rwkv4_tokenizer(input_text, add_special_tokens=True)["input_ids"])
20
  rwkv5_tokens = len(rwkv5_tokenizer(input_text, add_special_tokens=True)["input_ids"])
21
+ deepseekv2_tokens = len(deepseekv2_tokenizer(input_text, add_special_tokens=True)["input_ids"])
22
  internlm_tokens = len(internlm_tokenizer(input_text, add_special_tokens=True)["input_ids"])
23
  internlm2_tokens = len(internlm2_tokenizer(input_text, add_special_tokens=True)["input_ids"])
24
 
 
38
  "CodeQwen": codeqwen_tokens,
39
  "RWKV-v4": rwkv4_tokens,
40
  "RWKV-v5/RWKV-v6": rwkv5_tokens,
41
+ "DeepSeek-V2": deepseekv2_tokens,
42
  "InternLM": internlm_tokens,
43
  "InternLM2": internlm2_tokens
44
  }
 
65
  codeqwen_tokenizer = AutoTokenizer.from_pretrained("Qwen/CodeQwen1.5-7B")
66
  rwkv4_tokenizer = AutoTokenizer.from_pretrained("RWKV/rwkv-4-14b-pile", trust_remote_code=True)
67
  rwkv5_tokenizer = AutoTokenizer.from_pretrained("RWKV/v5-EagleX-v2-7B-HF", trust_remote_code=True)
68
+ deepseekv2_tokenizer = AutoTokenizer.from_pretrained("deepseek-ai/DeepSeek-V2", trust_remote_code=True)
69
  internlm_tokenizer = AutoTokenizer.from_pretrained("internlm/internlm-20b", trust_remote_code=True)
70
  internlm2_tokenizer = AutoTokenizer.from_pretrained("internlm/internlm2-20b", trust_remote_code=True)
71