Pratik Dwivedi committed on
Commit
d9c6906
·
1 Parent(s): 9bf72c1

multiple models

Browse files
Files changed (1) hide show
  1. app.py +25 -6
app.py CHANGED
@@ -8,14 +8,25 @@ def register_gguf_model():
8
 
9
  prompter = Prompt()
10
 
11
- your_model_name = "my_model"
12
  hf_repo_name = "TheBloke/Llama-2-7B-Chat-GGUF"
13
  model_file = "llama-2-7b-chat.Q5_K_S.gguf"
14
- print("registering model")
15
  prompter.model_catalog.register_gguf_model(your_model_name,hf_repo_name, model_file, prompt_wrapper="open_chat")
16
- print("loading model")
17
- prompter.load_model(your_model_name)
18
-
 
 
 
 
 
 
 
 
 
 
 
19
  return prompter
20
 
21
  def load_pdf_from_url(url):
@@ -33,15 +44,20 @@ def load_pdf_content(pdf):
33
 
34
  def main():
35
  st.title("BetterZila RAG Enabled LLM")
 
 
36
 
 
 
37
  with st.spinner("Loading model..."):
38
- prompter = register_gguf_model()
39
  st.success("Model loaded!")
40
 
41
  with st.spinner("Loading PDF content from the assignment URL..."):
42
  url = "https://pgcag.files.wordpress.com/2010/01/48lawsofpower.pdf"
43
  pdf = load_pdf_from_url(url)
44
  content = load_pdf_content(pdf)
 
45
  st.success("PDF content loaded!")
46
 
47
  queries = ['Can you give me an example from history where the enemy was crushed totally from the book?', "What's the point of making myself less accessible?", "Can you tell me the story of Queen Elizabeth I from this 48 laws of power book?"]
@@ -49,8 +65,11 @@ def main():
49
  for query in queries:
50
  st.subheader(f"Query: {query}")
51
  with st.spinner("Generating response..."):
 
52
  resp = prompter.prompt_main(query, context=content)
53
  response = resp['llm_response']
 
 
54
  st.success("Response generated!")
55
  st.write(response)
56
 
 
8
 
9
  prompter = Prompt()
10
 
11
+ your_model_name = "llama"
12
  hf_repo_name = "TheBloke/Llama-2-7B-Chat-GGUF"
13
  model_file = "llama-2-7b-chat.Q5_K_S.gguf"
14
+ print("registering models")
15
  prompter.model_catalog.register_gguf_model(your_model_name,hf_repo_name, model_file, prompt_wrapper="open_chat")
16
+ your_model_name = "open_gpt4"
17
+ hf_repo_name = "TheBloke/Open_Gpt4_8x7B-GGUF"
18
+ model_file = "open_gpt4_8x7b.Q4_K_M.gguf"
19
+ prompter.model_catalog.register_gguf_model(your_model_name,hf_repo_name, model_file, prompt_wrapper="open_chat")
20
+ your_model_name = "phi2"
21
+ hf_repo_name = "TheBloke/phi-2-GGUF"
22
+ model_file = "phi-2.Q4_K_M.gguf"
23
+ prompter.model_catalog.register_gguf_model(your_model_name,hf_repo_name, model_file, prompt_wrapper="open_chat")
24
+ your_model_name = "mistral"
25
+ hf_repo_name = "TheBloke/Mistral-7B-Instruct-v0.2-GGUF"
26
+ model_file = "mistral-7b-instruct-v0.2.Q4_K_M.gguf"
27
+ prompter.model_catalog.register_gguf_model(your_model_name,hf_repo_name, model_file, prompt_wrapper="open_chat")
28
+ # print("loading model")
29
+ # prompter.load_model(your_model_name)
30
  return prompter
31
 
32
  def load_pdf_from_url(url):
 
44
 
45
def main():
    """Streamlit entry point.

    Registers the available GGUF models, lets the user pick one, loads it,
    pulls the assignment PDF, and then answers a fixed list of queries with
    the PDF content supplied as RAG context.
    """
    st.title("BetterZila RAG Enabled LLM")
    with st.spinner("Registering Models for use..."):
        prompter = register_gguf_model()

    # Names must match those registered in register_gguf_model().
    model_name = st.selectbox("Select Model", ["llama", "open_gpt4", "phi2", "mistral"])
    st.write("You selected: ", model_name)
    with st.spinner("Loading model..."):
        prompter.load_model(model_name)
    st.success("Model loaded!")

    with st.spinner("Loading PDF content from the assignment URL..."):
        url = "https://pgcag.files.wordpress.com/2010/01/48lawsofpower.pdf"
        pdf = load_pdf_from_url(url)
        content = load_pdf_content(pdf)
        print("Loaded PDF content")
    st.success("PDF content loaded!")

    queries = ['Can you give me an example from history where the enemy was crushed totally from the book?', "What's the point of making myself less accessible?", "Can you tell me the story of Queen Elizabeth I from this 48 laws of power book?"]

    for query in queries:
        st.subheader(f"Query: {query}")
        with st.spinner("Generating response..."):
            print("Query: ", query)
            resp = prompter.prompt_main(query, context=content)
            response = resp['llm_response']
            # BUG FIX: the usage metadata lives on the full response dict
            # (`resp`), not on the extracted 'llm_response' text — indexing
            # the string with ['usage'] raised TypeError.
            print("Time taken: ", resp['usage']['processing_time'])
            print("Response: ", response)
        st.success("Response generated!")
        st.write(response)
75