theosaurus committed
Commit · b6072e3 · 1 Parent(s): 504b277
Add GPU decorator to generate_response function and improve login feedback
app.py CHANGED

@@ -58,7 +58,6 @@ llm_model = AutoModelForCausalLM.from_pretrained(
     quantization_config=model_config,
     device_map="auto")
 
-@spaces.GPU
 def initialize_llm():
     """
     Initialize the LLM with careful memory management.
@@ -79,6 +78,7 @@ def initialize_llm():
 
     return model, tokenizer
 
+@spaces.GPU
 def generate_response(prompt:str, history: Optional[list], llm: Optional[AutoModelForCausalLM], tokenizer, max_length: int = 100) -> str:
     """
     Generate a response from the LLM model given a prompt.
@@ -111,8 +111,8 @@ demo = gr.ChatInterface(
 
 if __name__ == "__main__":
     auth = HuggingFaceLogin()
-    auth.login()
+    if auth.login():
+        print("Login successful!")
 
-    # Initialize the model and tokenizer
     llm_model, llm_tokenizer = initialize_llm()
     demo.launch()
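
Context for the decorator move (not stated in the commit itself, just how ZeroGPU Spaces behave): @spaces.GPU requests a GPU only for the duration of each decorated call, so attaching it to the per-request generate_response rather than the startup-time initialize_llm holds the GPU only while a reply is being generated. A minimal sketch of that pattern follows; the model id and generation details are placeholders, not this Space's actual code:

import spaces
import torch
from transformers import AutoModelForCausalLM, AutoTokenizer

# Placeholder model id; the Space loads its own quantized model instead.
model_id = "gpt2"
tokenizer = AutoTokenizer.from_pretrained(model_id)
model = AutoModelForCausalLM.from_pretrained(model_id, device_map="auto")

@spaces.GPU  # GPU is allocated only while this function runs
def generate_response(prompt: str, max_length: int = 100) -> str:
    # Tokenize on whatever device the model was placed on.
    inputs = tokenizer(prompt, return_tensors="pt").to(model.device)
    with torch.no_grad():
        output = model.generate(**inputs, max_new_tokens=max_length)
    return tokenizer.decode(output[0], skip_special_tokens=True)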