Update app.py
app.py CHANGED
@@ -44,6 +44,8 @@ from llama_index.core.node_parser.relational.base_element import (
 )
 from llama_index.core.schema import BaseNode, TextNode
 
+
+api_token = os.getenv("HF_TOKEN")
 # Implementations
 
 # default_persist_directory = './chroma_HF/'
@@ -94,6 +96,7 @@ def initialize_llmchain(llm_model, temperature, max_tokens, top_k, vector_db, pr
     if llm_model == "mistralai/Mixtral-8x7B-Instruct-v0.3":
         llm = HuggingFaceEndpoint(
             repo_id=llm_model,
+            huggingfacehub_api_token = api_token,
             temperature = temperature,
             max_new_tokens = max_tokens,
             top_k = top_k,
@@ -103,6 +106,7 @@ def initialize_llmchain(llm_model, temperature, max_tokens, top_k, vector_db, pr
         raise gr.Error("LLM model is too large to be loaded automatically on free inference endpoint")
         llm = HuggingFaceEndpoint(
             repo_id=llm_model,
+            huggingfacehub_api_token = api_token,
             temperature = temperature,
             max_new_tokens = max_tokens,
             top_k = top_k,
@@ -110,6 +114,7 @@ def initialize_llmchain(llm_model, temperature, max_tokens, top_k, vector_db, pr
     elif llm_model == "microsoft/phi-2":
         llm = HuggingFaceEndpoint(
             repo_id=llm_model,
+            huggingfacehub_api_token = api_token,
             temperature = temperature,
             max_new_tokens = max_tokens,
             top_k = top_k,
@@ -118,7 +123,8 @@ def initialize_llmchain(llm_model, temperature, max_tokens, top_k, vector_db, pr
         )
     elif llm_model == "TinyLlama/TinyLlama-1.1B-Chat-v1.0":
         llm = HuggingFaceEndpoint(
-            repo_id=llm_model,
+            repo_id=llm_model,
+            huggingfacehub_api_token = api_token,
             temperature = temperature,
             max_new_tokens = 250,
             top_k = top_k,
@@ -127,6 +133,7 @@ def initialize_llmchain(llm_model, temperature, max_tokens, top_k, vector_db, pr
         raise gr.Error("Llama-2-7b-chat-hf model requires a Pro subscription...")
         llm = HuggingFaceEndpoint(
             repo_id=llm_model,
+            huggingfacehub_api_token = api_token,
             temperature = temperature,
             max_new_tokens = max_tokens,
             top_k = top_k,
@@ -134,6 +141,7 @@ def initialize_llmchain(llm_model, temperature, max_tokens, top_k, vector_db, pr
     else:
         llm = HuggingFaceEndpoint(
             repo_id=llm_model,
+            huggingfacehub_api_token = api_token,
             temperature = temperature,
             max_new_tokens = max_tokens,
             top_k = top_k,
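Every branch of initialize_llmchain repeats the same change: HF_TOKEN is read from the environment once at module level and passed to HuggingFaceEndpoint as huggingfacehub_api_token. A minimal sketch of that pattern, collapsed into one helper, follows; the build_llm name and the langchain_community import path are assumptions for illustration, not part of app.py.

import os

# Assumed import path; app.py may import HuggingFaceEndpoint from a
# different LangChain module.
from langchain_community.llms import HuggingFaceEndpoint

# Read the Hugging Face token once, as the commit does at module level.
api_token = os.getenv("HF_TOKEN")

def build_llm(llm_model, temperature, max_tokens, top_k):
    # Hypothetical helper: one endpoint construction instead of one per branch.
    # TinyLlama keeps the hard-coded 250-token cap used in app.py.
    if llm_model == "TinyLlama/TinyLlama-1.1B-Chat-v1.0":
        max_tokens = 250
    return HuggingFaceEndpoint(
        repo_id=llm_model,
        huggingfacehub_api_token=api_token,  # the argument added by this commit
        temperature=temperature,
        max_new_tokens=max_tokens,
        top_k=top_k,
    )

Passing the token explicitly means the endpoint client no longer relies on an ambient login, which is presumably why the commit threads api_token through every HuggingFaceEndpoint call on a Space where the token is only exposed as the HF_TOKEN secret.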