adi2606 committed on
Commit
dbb3b1f
·
verified ·
1 Parent(s): 22209ca

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +10 -11
app.py CHANGED
@@ -10,24 +10,23 @@ model = AutoModelForCausalLM.from_pretrained("adi2606/MenstrualQA").to(device)
10
  tokenizer = AutoTokenizer.from_pretrained("adi2606/MenstrualQA")
11
 
12
  # Function to generate a response from the chatbot
13
- def generate_response(message: str, temperature: float = 0.4, repetition_penalty: float = 1.1, max_input_length: int = 256) -> str:
14
- inputs = tokenizer(
15
- message,
16
- return_tensors="pt",
17
- padding=True,
18
- truncation=True,
19
- max_length=max_input_length
 
20
  ).to(device)
21
 
22
  # Generate the response
23
  output = model.generate(
24
- inputs['input_ids'],
25
- attention_mask=inputs['attention_mask'],
26
  max_length=512,
27
  temperature=temperature,
28
  repetition_penalty=repetition_penalty,
29
- do_sample=True,
30
- pad_token_id=tokenizer.eos_token_id
31
  )
32
 
33
  # Decode the generated output
 
10
  tokenizer = AutoTokenizer.from_pretrained("adi2606/MenstrualQA")
11
 
12
  # Function to generate a response from the chatbot
13
+ def generate_response(message: str, temperature: float = 0.4, repetition_penalty: float = 1.1) -> str:
14
+ # Apply the chat template and convert to PyTorch tensors
15
+ messages = [
16
+ {"role": "system", "content": "You are a helpful assistant."},
17
+ {"role": "user", "content": message}
18
+ ]
19
+ input_ids = tokenizer.apply_chat_template(
20
+ messages, add_generation_prompt=True, return_tensors="pt"
21
  ).to(device)
22
 
23
  # Generate the response
24
  output = model.generate(
25
+ input_ids,
 
26
  max_length=512,
27
  temperature=temperature,
28
  repetition_penalty=repetition_penalty,
29
+ do_sample=True
 
30
  )
31
 
32
  # Decode the generated output