Jesus Andres Correal Ortiz
committed on
Commit
·
0a0007f
1
Parent(s):
3719454
Updated app.py to fix error in dtypes
Browse files- app.py +15 -3
- fine-tuning.ipynb +5 -0
app.py
CHANGED
@@ -7,21 +7,33 @@ model_name = "acorreal/phi3-project-management"
|
|
7 |
tokenizer = AutoTokenizer.from_pretrained(model_name)
|
8 |
model = AutoModelForSequenceClassification.from_pretrained(model_name)
|
9 |
|
|
|
|
|
|
|
|
|
|
|
10 |
# Streamlit app
|
11 |
st.title('Project Management Educational Tutor')
|
12 |
-
|
|
|
13 |
|
14 |
user_input = st.text_area("Enter your project management question or topic here:")
|
15 |
|
16 |
if st.button('Get Response'):
|
17 |
if user_input:
|
18 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
19 |
with torch.no_grad():
|
20 |
outputs = model(**inputs)
|
21 |
logits = outputs.logits
|
22 |
predicted_class_id = logits.argmax().item()
|
23 |
|
24 |
st.write(f"Predicted class ID: {predicted_class_id}")
|
25 |
-
|
26 |
else:
|
27 |
st.write("Please enter a question or topic to get a response.")
|
|
|
7 |
tokenizer = AutoTokenizer.from_pretrained(model_name)
|
8 |
model = AutoModelForSequenceClassification.from_pretrained(model_name)
|
9 |
|
10 |
+
# Ensure the model is on the correct device and using the right dtype
|
11 |
+
device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
|
12 |
+
model.to(device)
|
13 |
+
model.eval() # Set model to evaluation mode
|
14 |
+
|
15 |
# Streamlit app
|
16 |
st.title('Project Management Educational Tutor')
|
17 |
+
|
18 |
+
st.write('This app uses the "acorreal/phi3-project-management" model to provide insights on project management topics.')
|
19 |
|
20 |
user_input = st.text_area("Enter your project management question or topic here:")
|
21 |
|
22 |
if st.button('Get Response'):
|
23 |
if user_input:
|
24 |
+
|
25 |
+
# Tokenize the input and move it to the correct device
|
26 |
+
inputs = tokenizer(user_input, return_tensors="pt").to(device)
|
27 |
+
|
28 |
+
# Ensure inputs are in the correct dtype
|
29 |
+
inputs = {k: v.to(dtype=torch.float32 if model.dtype == torch.float32 else torch.float16) for k, v in inputs.items()}
|
30 |
+
|
31 |
with torch.no_grad():
|
32 |
outputs = model(**inputs)
|
33 |
logits = outputs.logits
|
34 |
predicted_class_id = logits.argmax().item()
|
35 |
|
36 |
st.write(f"Predicted class ID: {predicted_class_id}")
|
37 |
+
|
38 |
else:
|
39 |
st.write("Please enter a question or topic to get a response.")
|
fine-tuning.ipynb
CHANGED
@@ -71,8 +71,13 @@
|
|
71 |
},
|
72 |
"outputs": [],
|
73 |
"source": [
|
|
|
74 |
"base_model_name = \"microsoft/Phi-3-mini-4k-instruct\"\n",
|
|
|
|
|
75 |
"model_name=\"acorreal/project-management-tutor\"\n",
|
|
|
|
|
76 |
"use_4bit = True\n",
|
77 |
"bnb_4bit_quant_type = \"nf4\"\n",
|
78 |
"use_double_quant = True\n",
|
|
|
71 |
},
|
72 |
"outputs": [],
|
73 |
"source": [
|
74 |
+
"# Name of the model to use as parent model\n",
|
75 |
"base_model_name = \"microsoft/Phi-3-mini-4k-instruct\"\n",
|
76 |
+
"\n",
|
77 |
+
"# Name of the new model\n",
|
78 |
"model_name=\"acorreal/project-management-tutor\"\n",
|
79 |
+
"\n",
|
80 |
+
"# Set the model configuration\n",
|
81 |
"use_4bit = True\n",
|
82 |
"bnb_4bit_quant_type = \"nf4\"\n",
|
83 |
"use_double_quant = True\n",
|