wop committed on
Commit
9f6a9bd
·
1 Parent(s): b22ad80

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +9 -15
app.py CHANGED
@@ -5,16 +5,14 @@ import gradio as gr
5
  import requests
6
  import json
7
 
8
- from accelerate import Accelerator
9
-
10
  SYSTEM_PROMPT = "As a generative chatbot (you are not a GPT but your structure is 50% the same), your primary function is to provide helpful and friendly responses to user queries. Feel free to add some personality, but make sure your responses are accurate and helpful. Your owner and developer is: @Costikoooo (Discord user) other developers are unknown. Your name is Chattybot."
11
  TITLE = "Chattybot"
12
  EXAMPLE_INPUT = "hello"
13
 
14
- # Use your provided tokenizer and model
15
- tokenizer = AutoTokenizer.from_pretrained('stabilityai/stablelm-zephyr-3b')
16
  model = AutoModelForCausalLM.from_pretrained(
17
- 'stabilityai/stablelm-zephyr-3b',
18
  trust_remote_code=True,
19
  device_map="auto"
20
  )
@@ -22,12 +20,6 @@ model = AutoModelForCausalLM.from_pretrained(
22
  HF_TOKEN = os.getenv("HF_TOKEN")
23
  HEADERS = {"Authorization": f"Bearer {HF_TOKEN}"}
24
 
25
- # Initialize Accelerator
26
- accelerator = Accelerator()
27
-
28
- # Wrap model and tokenizer with accelerator
29
- model, tokenizer = accelerator.prepare(model, tokenizer)
30
-
31
  def build_input_prompt(message, chatbot, system_prompt):
32
  input_prompt = "\n" + system_prompt + "</s>\n\n"
33
  for interaction in chatbot:
@@ -40,15 +32,17 @@ def predict_beta(message, chatbot=[], system_prompt=""):
40
  input_prompt = build_input_prompt(message, chatbot, system_prompt)
41
  inputs = tokenizer(input_prompt, return_tensors="pt")
42
 
43
- with accelerator.device():
44
  tokens = model.generate(
45
  inputs["input_ids"],
46
  max_length=1024,
47
  temperature=0.8,
48
  do_sample=True
49
  )
50
- bot_message = tokenizer.decode(tokens[0], skip_special_tokens=True)
51
- return bot_message
 
 
52
 
53
  def test_preview_chatbot(message, history):
54
  response = predict_beta(message, history, SYSTEM_PROMPT)
@@ -66,4 +60,4 @@ textbox_preview = gr.Textbox(scale=7, container=False, value=EXAMPLE_INPUT)
66
 
67
  demo = gr.ChatInterface(test_preview_chatbot, chatbot=chatbot_preview, textbox=textbox_preview)
68
 
69
- demo.launch()
 
5
  import requests
6
  import json
7
 
 
 
8
  SYSTEM_PROMPT = "As a generative chatbot (you are not a GPT but your structure is 50% the same), your primary function is to provide helpful and friendly responses to user queries. Feel free to add some personality, but make sure your responses are accurate and helpful. Your owner and developer is: @Costikoooo (Discord user) other developers are unknown. Your name is Chattybot."
9
  TITLE = "Chattybot"
10
  EXAMPLE_INPUT = "hello"
11
 
12
+ # Use a smaller model (EleutherAI/gpt-neo-125M)
13
+ tokenizer = AutoTokenizer.from_pretrained('EleutherAI/gpt-neo-125M')
14
  model = AutoModelForCausalLM.from_pretrained(
15
+ 'EleutherAI/gpt-neo-125M',
16
  trust_remote_code=True,
17
  device_map="auto"
18
  )
 
20
  HF_TOKEN = os.getenv("HF_TOKEN")
21
  HEADERS = {"Authorization": f"Bearer {HF_TOKEN}"}
22
 
 
 
 
 
 
 
23
  def build_input_prompt(message, chatbot, system_prompt):
24
  input_prompt = "\n" + system_prompt + "</s>\n\n"
25
  for interaction in chatbot:
 
32
  input_prompt = build_input_prompt(message, chatbot, system_prompt)
33
  inputs = tokenizer(input_prompt, return_tensors="pt")
34
 
35
+ try:
36
  tokens = model.generate(
37
  inputs["input_ids"],
38
  max_length=1024,
39
  temperature=0.8,
40
  do_sample=True
41
  )
42
+ bot_message = tokenizer.decode(tokens[0], skip_special_tokens=True)
43
+ return bot_message
44
+ except Exception as e:
45
+ raise gr.Error(str(e))
46
 
47
  def test_preview_chatbot(message, history):
48
  response = predict_beta(message, history, SYSTEM_PROMPT)
 
60
 
61
  demo = gr.ChatInterface(test_preview_chatbot, chatbot=chatbot_preview, textbox=textbox_preview)
62
 
63
+ demo.launch()