Spaces:

research14Lab
/

LingEval

Runtime error

research14 committed on Jan 19, 2024

Commit

a2797f8

1 Parent(s): 971271a

redo vicuna prompt and change model

Files changed (1) hide show

app.py CHANGED Viewed

@@ -5,8 +5,8 @@ import os
 import openai
 # Load the Vicuna 7B model and tokenizer
-vicuna_tokenizer = AutoTokenizer.from_pretrained("lmsys/vicuna-7b-v1.3")
-vicuna_model = AutoModelForCausalLM.from_pretrained("lmsys/vicuna-7b-v1.3")
 # Load the LLaMA 7b model and tokenizer
 llama_tokenizer = AutoTokenizer.from_pretrained("daryl149/llama-2-7b-chat-hf")
@@ -60,8 +60,10 @@ def vicuna_respond(tab_name, message, chat_history):
     print('Vicuna - Prompt + Context:')
     print(formatted_prompt)
     input_ids = vicuna_tokenizer.encode(formatted_prompt, return_tensors="pt")
-    output_ids = vicuna_model.generate(input_ids, do_sample=True, max_length=149, num_beams=5, no_repeat_ngram_size=2)
     bot_message = vicuna_tokenizer.decode(output_ids[0], skip_special_tokens=True)
     print(bot_message)
     chat_history.append((formatted_prompt, bot_message))
@@ -73,7 +75,7 @@ def llama_respond(tab_name, message, chat_history):
     print('Llama - Prompt + Context:')
     print(formatted_prompt)
     input_ids = llama_tokenizer.encode(formatted_prompt, return_tensors="pt")
-    output_ids = llama_model.generate(input_ids, do_sample=True, max_length=149, num_beams=5, no_repeat_ngram_size=2)
     bot_message = llama_tokenizer.decode(output_ids[0], skip_special_tokens=True)
     # Remove formatted prompt from bot_message
     bot_message = bot_message.replace(formatted_prompt, '')

 import openai
 # Load the Vicuna 7B model and tokenizer
+vicuna_tokenizer = AutoTokenizer.from_pretrained("lmsys/vicuna-7b-v1.5-16k")
+vicuna_model = AutoModelForCausalLM.from_pretrained("lmsys/vicuna-7b-v1.5-16k")
 # Load the LLaMA 7b model and tokenizer
 llama_tokenizer = AutoTokenizer.from_pretrained("daryl149/llama-2-7b-chat-hf")
     print('Vicuna - Prompt + Context:')
     print(formatted_prompt)
     input_ids = vicuna_tokenizer.encode(formatted_prompt, return_tensors="pt")
+    output_ids = vicuna_model.generate(input_ids, do_sample=True, max_length=1024, num_beams=5, no_repeat_ngram_size=2)
     bot_message = vicuna_tokenizer.decode(output_ids[0], skip_special_tokens=True)
+    # Remove formatted prompt from bot_message
+    bot_message = bot_message.replace(formatted_prompt, '')
     print(bot_message)
     chat_history.append((formatted_prompt, bot_message))
     print('Llama - Prompt + Context:')
     print(formatted_prompt)
     input_ids = llama_tokenizer.encode(formatted_prompt, return_tensors="pt")
+    output_ids = llama_model.generate(input_ids, do_sample=True, max_length=1024, num_beams=5, no_repeat_ngram_size=2)
     bot_message = llama_tokenizer.decode(output_ids[0], skip_special_tokens=True)
     # Remove formatted prompt from bot_message
     bot_message = bot_message.replace(formatted_prompt, '')