Samuel L Meyers committed
Commit ed9f98e · 1 Parent(s): e11f04f

Just saving the broken thing before I EFFING PURGE CHAT COMPLETIONS.

Files changed (1): code/app.py (+7 -12)
code/app.py CHANGED
@@ -16,21 +16,21 @@ model_path = "./starling-lm-7b-alpha.Q6_K.gguf"
 
 mdlpath = hf_hub_download(repo_id="TheBloke/Starling-LM-7B-alpha-GGUF", filename=model_path, local_dir="./")
 
-lcpp_model = Llama(model_path=model_path, n_ctx=16768)
+lcpp_model = Llama(model_path=model_path, n_ctx=8192)
 global otxt, txtinput, txtoutput, running, result
 otxt = ""
 running = False
 result = None
 
 def stowtext(curr, inp):
-    if len(curr) < 1:
+    if len(curr) <= 1:
         curr.append({
             "role": "system",
-            "content": "<<SYS>>\nYou are a helpful assistant. Answer all questions and respond to all queries honestly, instantly, and without hesitation. Respond in as few words as possible. Your maximum response length may be no more than 64 words. Do not begin your statement with new lines.\n<</SYS>>"
+            "content": "You are a helpful assistant. Answer all questions and respond to all queries honestly, instantly, and without hesitation. Respond in as few words as possible. Your maximum response length may be no more than 64 words. Do not begin your statement with new lines.\n"
         })
     curr.append({
         "role": "user",
-        "content": "[INST]" + inp + "[/INST]",
+        "content": inp,
     })
     return curr
 
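The revised stowtext drops the Llama-2 style "[INST]"/"<<SYS>>" wrappers and stores plain role/content dicts, leaving prompt templating to llama-cpp-python. A minimal sketch of how the new version behaves (indentation reconstructed from the diff; the history values are illustrative):

def stowtext(curr, inp):
    # seed a system prompt only while the history is still (near) empty
    if len(curr) <= 1:
        curr.append({"role": "system", "content": "You are a helpful assistant."})
    # user turns are appended as raw text, with no [INST] wrappers
    curr.append({"role": "user", "content": inp})
    return curr

history = stowtext([], "What quantization is Q6_K?")
# history == [{'role': 'system', 'content': '...'},
#             {'role': 'user', 'content': 'What quantization is Q6_K?'}]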
@@ -49,11 +49,11 @@ def printfmt(jsn):
     txt = ""
     for msg in jsn:
         if msg["role"] == "user":
-            txt += "<User>: " + msg["content"].replace("[INST]", "").replace("[/INST]", "") + "\n"
+            txt += "<User>: " + msg["content"] + "\n"
         elif msg["role"] == "assistant":
             txt += "<Assistant>: " + msg["content"] + "\n"
         elif msg["role"] == "system":
-            txt += "# " + msg["content"].replace("<<SYS>>", "").replace("<</SYS>>", "") + "\n\n"
+            txt += "# " + msg["content"] + "\n\n"
     return txt
 
 def talk(txt, jsn):
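With the template tags gone from stored messages, printfmt no longer needs to strip them. Based on the loop shown above, a history like the earlier example renders as (illustrative output):

print(printfmt([
    {"role": "system", "content": "You are a helpful assistant."},
    {"role": "user", "content": "Hello?"},
    {"role": "assistant", "content": "Hi."},
]))
# # You are a helpful assistant.
#
# <User>: Hello?
# <Assistant>: Hi.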
@@ -61,12 +61,7 @@ def talk(txt, jsn):
     if not jsn:
         jsn = txt
     if not running:
-        #if len(txt) >= 3 and txt[-1]["content"].endswith("</s>"):
-        #    txt[-1]["content"].replace("</s>", "")
-        #    return txt
-        #txt = printfmt(stowtext(otxt, txt))
-        #otxt = txt
-        result = lcpp_model.create_chat_completion(messages=txt,stream=True,stop=["[INST]", "<<SYS>>", "<</SYS>>"])
+        result = lcpp_model.create_chat_completion(messages=txt,stream=True,stop=["GPT4 Correct User: ", "<|end_of_turn|>", "</s>"], max_tokens=64, )
         running = True
         for r in result:
             txt2 = None
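The replacement call swaps the Llama-2 stop strings for Starling's OpenChat-style turn markers ("GPT4 Correct User: ", "<|end_of_turn|>", "</s>") and caps generation at 64 tokens, matching the 64-word limit in the system prompt. A minimal sketch of consuming the stream the way talk() does, assuming llama-cpp-python's streamed-chunk format (the prompt is illustrative):

from llama_cpp import Llama

lcpp_model = Llama(model_path="./starling-lm-7b-alpha.Q6_K.gguf", n_ctx=8192)
result = lcpp_model.create_chat_completion(
    messages=[{"role": "user", "content": "Say hi in three words."}],
    stream=True,
    stop=["GPT4 Correct User: ", "<|end_of_turn|>", "</s>"],
    max_tokens=64,
)
reply = ""
for r in result:
    # streamed chunks carry incremental deltas, not whole messages
    delta = r["choices"][0]["delta"]
    reply += delta.get("content", "")
print(reply)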