Spaces: Runtime error

Salvatore Rossitto committed · Commit 4190d92 · 1 Parent(s): 9778c3b · Browse files

RBotReloaded.py  +11 -12
RBotReloaded.py
CHANGED
@@ -69,11 +69,11 @@ def validate_and_fix_params(tool_name, params_list):
 def create_llm(model_id=f"{MODELS_DIR}/mistral-7b-instruct-v0.1.Q4_K_M.gguf", load_4bit=False, load_8bit=False, ctx_len = 8192, temperature=0.5, top_p=0.95):
     if (model_id.startswith("http")):
         print(f"Creating TextGen LLM base_url:{model_id}")
-        return TextGen(model_url=model_id, callbacks=[StreamingStdOutCallbackHandler()])
+        return TextGen(model_url=model_id, seed=79, callbacks=[StreamingStdOutCallbackHandler()])
     if (os.path.exists(model_id)):
         try:
             print(f"Creating LlamaCpp LLM model_id:{model_id}")
-            return LlamaCpp(model_path=model_id, verbose=True, n_batch=521, alpha_value=1,rope_freq_base=10000,compress_pos_emb=ctx_len / 4096, n_ctx=ctx_len, load_in_4bit=load_4bit, load_in_8bit=load_8bit, temperature=temperature,top_p=top_p)
+            return LlamaCpp(model_path=model_id, verbose=True, n_batch=521, seed=79, alpha_value=1,rope_freq_base=10000,compress_pos_emb=ctx_len / 4096, n_ctx=ctx_len, load_in_4bit=load_4bit, load_in_8bit=load_8bit, temperature=temperature,top_p=top_p)
         except Exception as ex:
             try:
                 print(f"Creating CTransformers LLM model_id:{model_id}")
@@ -84,7 +84,7 @@ def create_llm(model_id=f"{MODELS_DIR}/mistral-7b-instruct-v0.1.Q4_K_M.gguf", lo
                     "top_p":top_p,
                     "temperature":temperature
                 }
-                return CTransformers(model=model_id, model_type='llama', config=config)
+                return CTransformers(model=model_id, model_type='llama', seed=79, config=config)
 
             except Exception as ex:
                 print(f"Load Error {str(ex)}")
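Note on these two hunks: the commit threads a fixed seed=79 through every loader branch (TextGen, LlamaCpp, CTransformers), pinning the sampler RNG so an identical prompt reproduces identical output even at temperature > 0. A minimal sketch of the try/except fallback pattern create_llm uses, assuming the classic LangChain wrappers; names and config keys below are illustrative, not the repo's exact code:

# Sketch only, not part of the commit.
from langchain.llms import LlamaCpp, CTransformers

def load_with_fallback(model_path, seed=79, ctx_len=8192):
    """Try the llama-cpp backend first, fall back to ctransformers."""
    try:
        # seed fixes the sampling RNG; -1 (the default) would re-seed per run.
        return LlamaCpp(model_path=model_path, n_ctx=ctx_len, seed=seed)
    except Exception as ex:
        print(f"LlamaCpp load failed ({ex}); trying CTransformers")
        # ctransformers reads generation settings from a config dict.
        return CTransformers(model=model_path, model_type="llama",
                             config={"context_length": ctx_len, "seed": seed})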
@@ -269,15 +269,14 @@ AI: SearchAndReply("recent cryptocurrency news")
 USER: Can you calculate the factorial of 5?
 AI: Calculator("factorial(5)")
 
-###
-
-
-
+### REAL CONVERSATION:
+[INST]
+SYSTEM: You are {AI_NAME} a smart and helpful AI assistant with access to external tools and knowledge.
+Today is {str(datetime.now().date())}, please reply last user message directly or invoking a valid action from the following list:
+{self.tools_prompt()}
+[/INST]
 {formatted_history}
 USER: {input}
-SYS: Please reply last user message directly or invoking a valid action from the following list:
-{self.tools_prompt()}
-
 AI:
 """
 observations = []
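Note on this hunk: the rework replaces the bare "###" separator and the trailing SYS: instruction with an explicit "### REAL CONVERSATION:" marker and a Mistral-style [INST]...[/INST] system block placed before the history, so the model reads its instructions and tool list ahead of the conversation rather than after the latest user turn. Roughly, the assembled prompt now has this shape (a sketch; the real code builds it inline as an f-string, and the variable names here are assumptions):

# Sketch only, not part of the commit.
from datetime import datetime

def build_prompt(ai_name, tools_prompt, formatted_history, user_input, few_shot=""):
    # Few-shot examples first, then the [INST]-wrapped system block,
    # then the running history and the new user turn.
    return f"""{few_shot}
### REAL CONVERSATION:
[INST]
SYSTEM: You are {ai_name} a smart and helpful AI assistant with access to external tools and knowledge.
Today is {datetime.now().date()}, please reply last user message directly or invoking a valid action from the following list:
{tools_prompt}
[/INST]
{formatted_history}
USER: {user_input}
AI:"""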
@@ -335,11 +334,11 @@ AI:
 
                 print(f"Action Output: {res}")
                 observations.append(f"Action Output: {res}")
-                prompt = prompt + f"Action: {tool.name}({action_input})\SYS:{res}"
+                prompt = prompt + f"Action: {tool.name}({action_input})\SYSTEM:{res}"
                 if (i+1 == self.max_iterations):
                     print(f"MAX ITERATIONS REACHED. PLEASE PROVIDE A FINAL RESPONSE!")
                     prompt = prompt + "\nMAX ITERATIONS REACHED. PLEASE PROVIDE A FINAL RESPONSE!\nAI:"
-                    output = str(self.llm(prompt,stop=["USER:","AI:","SYS:","[INST]","[/INST]"])).strip()
+                    output = str(self.llm(prompt,stop=["USER:","AI:","SYS:","SYSTEM:","[INST]","[/INST]"])).strip()
                     final_response = "\n*Reasoning: ".join(observations) + f"\n{output}" if len(observations) > 0 else f"\n{output}"
                     return { "output": final_response }
             else:
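Note on this hunk: each executed tool call is now written back into the transcript as a SYSTEM turn, and "SYSTEM:" joins the stop sequences so generation halts if the model starts fabricating a tool result of its own. A compressed sketch of that handshake, with an assumed harness around the repo's actual loop:

# Sketch only, not part of the commit.
STOP = ["USER:", "AI:", "SYS:", "SYSTEM:", "[INST]", "[/INST]"]

def run_step(llm, prompt, tool_name, action_input, result):
    # Feed the observation back as a SYSTEM turn, then ask for the next AI turn.
    prompt += f"Action: {tool_name}({action_input})\nSYSTEM:{result}\nAI:"
    # llm is any callable accepting (prompt, stop=[...]) and returning text,
    # e.g. the LangChain LLM objects produced by create_llm above.
    return prompt, str(llm(prompt, stop=STOP)).strip()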
|