Spaces:
Sleeping
Sleeping
Update app.py
Browse files
app.py
CHANGED
@@ -9,13 +9,15 @@ HF_TOKEN = os.environ.get("HF_TOKEN")
|
|
9 |
model_id = "JerniganLab/interviews-and-qa"
|
10 |
base_model = "meta-llama/Meta-Llama-3-8B-Instruct"
|
11 |
|
|
|
|
|
12 |
pipeline = transformers.pipeline(
|
13 |
"text-generation",
|
14 |
-
model=
|
15 |
model_kwargs={"torch_dtype": torch.bfloat16},
|
16 |
device="cuda",
|
17 |
)
|
18 |
-
pipeline.model = PeftModel.from_pretrained(
|
19 |
|
20 |
def chat_function(message, history, system_prompt, max_new_tokens, temperature):
|
21 |
messages = [{"role":"system","content":system_prompt},
|
|
|
9 |
model_id = "JerniganLab/interviews-and-qa"
|
10 |
base_model = "meta-llama/Meta-Llama-3-8B-Instruct"
|
11 |
|
12 |
+
llama_model = transformers.AutoModelForCausalLM.from_pretrained(base_model)
|
13 |
+
|
14 |
pipeline = transformers.pipeline(
|
15 |
"text-generation",
|
16 |
+
model=llama_model,
|
17 |
model_kwargs={"torch_dtype": torch.bfloat16},
|
18 |
device="cuda",
|
19 |
)
|
20 |
+
pipeline.model = PeftModel.from_pretrained(llama_model, model_id)
|
21 |
|
22 |
def chat_function(message, history, system_prompt, max_new_tokens, temperature):
|
23 |
messages = [{"role":"system","content":system_prompt},
|