Spaces:

mdacampora
/

tax-convos-demo

Runtime error

mdacampora committed on Apr 14, 2023

Commit

c8e23a7

1 Parent(s): 498a9d4

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -15,35 +15,35 @@ tokenizer = AutoTokenizer.from_pretrained(config.base_model_name_or_path)
 # Load the Lora model
 model = PeftModel.from_pretrained(model, peft_model_id)
-def make_inference(problem):
-    batch = tokenizer(
-        problem,
-        return_tensors="pt",
-    )
-    with torch.cuda.amp.autocast():
-        output_tokens = model.generate(**batch, max_new_tokens=50)
-# def make_inference(conversation):
-#     conversation_history = conversation
-#     response = ""
-#     while True:
-#         batch = tokenizer(
-#             f"### Problem:\n{conversation_history}\n{response}",
-#             return_tensors="pt",
-#         )
-#         with torch.cuda.amp.autocast():
-#             output_tokens = model.generate(**batch, max_new_tokens=50)
-#         new_response = tokenizer.decode(output_tokens[0], skip_special_tokens=True)
-#         if new_response.strip() == "":
-#             break
-#         response = f"\n{new_response}"
-#         conversation_history += response
-#     return conversation_history
 if __name__ == "__main__":

 # Load the Lora model
 model = PeftModel.from_pretrained(model, peft_model_id)
+# def make_inference(problem):
+#     batch = tokenizer(
+#         problem,
+#         return_tensors="pt",
+#     )
+#     with torch.cuda.amp.autocast():
+#         output_tokens = model.generate(**batch, max_new_tokens=50)
+def make_inference(conversation, max_turns=5):
+    """Extend ``conversation`` with model-generated replies.
+
+    Each round wraps the running conversation in a "### Problem:" prompt,
+    generates up to 50 new tokens, and appends the decoded reply to the
+    conversation on its own line. Generation stops as soon as a reply is
+    blank, or after ``max_turns`` rounds, whichever comes first.
+
+    Args:
+        conversation: Conversation text so far.
+        max_turns: Upper bound on generation rounds. The previous
+            ``while True`` loop had no bound and only ended on a blank
+            reply, which the model is never guaranteed to produce.
+
+    Returns:
+        The conversation text with every non-blank reply appended.
+    """
+    conversation_history = conversation
+    response = ""
+    # Decoder-only models return prompt + continuation from generate(), so
+    # decoding the full sequence always yields non-blank text (the prompt
+    # itself) and the blank-reply stop condition can never fire.
+    # Encoder-decoder models return only the new tokens.
+    # NOTE(review): assumes `model` exposes a Hugging Face style
+    # `config.is_encoder_decoder`; falls back to decoder-only -- confirm.
+    echoes_prompt = not getattr(
+        getattr(model, "config", None), "is_encoder_decoder", False
+    )
+    for _ in range(max_turns):
+        # NOTE(review): after the first round `response` is already part of
+        # `conversation_history`, so the latest reply appears twice in the
+        # prompt. Left unchanged to keep the prompt format as committed.
+        batch = tokenizer(
+            f"### Problem:\n{conversation_history}\n{response}",
+            return_tensors="pt",
+        )
+        with torch.cuda.amp.autocast():
+            output_tokens = model.generate(**batch, max_new_tokens=50)
+        generated = output_tokens[0]
+        if echoes_prompt:
+            # Drop the echoed prompt so only the newly generated tokens
+            # are decoded and appended.
+            generated = generated[batch["input_ids"].shape[1]:]
+        new_response = tokenizer.decode(generated, skip_special_tokens=True)
+        if not new_response.strip():
+            break
+        response = f"\n{new_response}"
+        conversation_history += response
+    return conversation_history
 if __name__ == "__main__":