Spaces:

FranciscoLozDataScience
/

smoker_model

Sleeping

App Files Files Community

FranciscoLozDataScience committed on Mar 21, 2024

Commit

fabb2c0

1 Parent(s): aa94aff

cleaned up code

Browse files

Files changed (2) hide show

app.py +1 -76
model.py +9 -13

app.py CHANGED Viewed

@@ -18,17 +18,6 @@ def predict(
     '''
     Predict the label for the input data
     '''
-    # # Combine the input data into a NumPy array
-    # input_array = np.array([
-    #     age, height, weight,
-    #     waist, eye_L, eye_R,
-    #     hear_L, hear_R, systolic,
-    #     relaxation, fasting_blood_sugar, cholesterol,
-    #     triglyceride, HDL, LDL,
-    #     hemoglobin, urine_protein,
-    #     serum_creatinine, AST, ALT,
-    #     Gtp, dental_caries
-    # ])
     # Create a dictionary with input data and dataset var names
     input_data = {
@@ -56,11 +45,10 @@ def predict(
         "dental caries": dental_caries
     }
-    # Convert the dictionary to a pandas DataFrame
     input_df = pd.DataFrame(input_data, index=[0])
     #predict
-    # label = MODEL.predict(input_array)
     label = MODEL.predict(input_df)
     return label
@@ -82,18 +70,8 @@ def load_interface():
     Configure Gradio interface
     '''
-    #example inputs
-    ex=[ #TODO: delete if file works
-        [20,85,135,190,30,125,53,126,0.1,9.9,0.1,9.9,1,2,1,2,79,240,40,140,55,505,72,371,16,405,4,618,1,1660,4.9,20.9,1,6,0.1,10.3,6,1311,1,2062,1,999,0,1],
-        [40,170,65,75.1,1.0,0.9,1,1,120,70,102,225,260,41,132,15.7,1,0.8,24,26,32,0,45,170,75,89.0,0.7,1.2,1,1,100,67,96,258,345,49,140,15.7,1,1.1,26,28,138,0,30],
-        [180,90,94.0,1.0,0.8,1,1,115,72,88,177,103,53,103,13.5,1,1.0,19,29,30,0,60,170,65,78.0,1.5,1.0,1,1,110,70,87,190,210,45,103,14.7,1,0.8,21,21,19,0,55],
-        [175,60,75.0,1.0,1.0,1,1,100,64,93,186,80,86,84,15.4,3,1.0,39,20,35,0,40,160,55,69.0,1.5,1.5,1,1,112,78,90,177,68,78,85,12.4,1,0.5,15,9,14,0,55],
-        [175,60,80.0,1.2,1.5,1.5,1,1,137,89,80,199,35,68,124,16.0,1,1.1,23,19,17,0,55,160,50,68.0,0.8,0.5,1,1,137,87,90,176,36,67,102,13.6,1,0.7,15,14,13,0]
-    ]
     #set blocks
     info_page = gr.Blocks()
-    # model_page = gr.Blocks()
     with info_page:
         # set title and description
@@ -141,59 +119,6 @@ def load_interface():
         """
         )
-    # with model_page:
-    #     # set title and description
-    #     gr.Markdown(
-    #     """
-    #     # Interact with the Ensemble Classifier Model
-    #     Enter sample bio data to predict smoking status.\n
-    #     **Medical Disclaimer**: The predictions provided by this model are for educational purposes only and should not be considered a substitute for professional medical advice.
-    #     """)
-    #     #set inputs in rows of 3
-    #     with gr.Row():
-    #         age = gr.Number(label="Age", precision=0, minimum=0)
-    #         height = gr.Number(label="Height(cm)", precision=0, minimum=0)
-    #         weight = gr.Number(label="Weight(kg)", precision=0, minimum=0)
-    #     with gr.Row():
-    #         waist = gr.Number(label="Waist(cm)", minimum=0, info="Waist circumference length")
-    #         eye_L = gr.Number(label="Visual acuity of the left eye, measured in diopters (D)", minimum=0)
-    #         eye_R = gr.Number(label="Visual acuity of the right eye, measured in diopters (D)", minimum=0)
-    #     with gr.Row():
-    #         hear_L = gr.Radio(label="Is there any hearing ability in the left ear?",choices=[("Yes",1),("No",2)])
-    #         hear_R = gr.Radio(label="Is there any hearing ability in the right ear?",choices=[("Yes",1),("No",2)])
-    #         systolic = gr.Number(label="Systolic(mmHg)", precision=0, minimum=0, info="Blood Pressure")
-    #     with gr.Row():
-    #         relaxation = gr.Number(label="Relaxation(mmHg)", precision=0, minimum=0, info="Blood Pressure")
-    #         fasting_blood_sugar = gr.Number(label="Fasting Blood Sugar(mg/dL)", precision=0, minimum=0, info="the concentration of glucose (sugar) in the bloodstream after an extended period of fasting")
-    #         cholesterol = gr.Number(label="Total Cholesterol(mg/dL)", precision=0, minimum=0, info="Total amount of cholesterol present in the blood")
-    #     with gr.Row():
-    #         triglyceride = gr.Number(label="Triglyceride(mg/dL)", precision=0, minimum=0, info="A type of fat (lipid) found in blood")
-    #         HDL = gr.Number(label="High-Density Lipoprotein(mg/dL) ", precision=0, minimum=0, info="It is commonly referred to as 'good cholesterol'")
-    #         LDL = gr.Number(label="Low-Density Lipoprotein(mg/dL) ", precision=0, minimum=0, info="It is commonly referred to as 'bad cholesterol'")
-    #     with gr.Row():
-    #         hemoglobin = gr.Number(label="Hemoglobin(g/dL)", minimum=0, info="a protein found in red blood cells that is responsible for carrying oxygen from the lungs to the tissues and organs of the body")
-    #         urine_protein = gr.Radio(label="Does urine contain excessive traces of protein?",choices=[("Yes",2),("No",1)], info="when excessive protein is detected in the urine, it may indicate a problem with kidney function or other underlying health conditions.")
-    #         serum_creatinine = gr.Number(label="Serum creatinine(mg/dL)", minimum=0, info="Serum creatinine levels are commonly measured through a blood test and are used to assess kidney function")
-    #     with gr.Row():
-    #         AST = gr.Number(label="Aspartate Aminotransferase(IU/L)", precision=0, minimum=0, info="glutamic oxaloacetic transaminase type; AST is released into the bloodstream when cells are damaged or destroyed, such as during injury or disease affecting organs rich in AST.")
-    #         ALT = gr.Number(label="Alanine Aminotransferase(IU/L)", precision=0, minimum=0, info="glutamic oxaloacetic transaminase type; ALT is primarily found in the liver cells, and increased levels of ALT in the blood can indicate liver damage or disease")
-    #         Gtp = gr.Number(label="Gamma-glutamyl Transferase(IU/L)", precision=0, minimum=0, info="Elevated levels of GGT in the blood can indicate liver disease or bile duct obstruction. GGT levels are often measured alongside other liver function tests to assess liver health and function.")
-    #     dental_caries = gr.Radio(label="Are there any signs of dental cavities?",choices=[("Yes",1),("No",0)])
-    #     #set button row
-    #     with gr.Row():
-    #         pred_btn = gr.Button("Predict")
-    #         clear_btn = gr.Button("Clear")
-    #     #set label txt box
-    #     smoker_label = gr.Label(label="Predicted Label")
-    #     #set event listeners
-    #     inputs = [age, height, weight, waist, eye_L, eye_R, hear_L, hear_R, systolic, relaxation, fasting_blood_sugar, cholesterol, triglyceride, HDL, LDL, hemoglobin, urine_protein, serum_creatinine, AST, ALT, Gtp, dental_caries]
-    #     pred_btn.click(fn=predict, inputs=inputs, outputs=smoker_label)
-    #     clear_btn.click(lambda: [None]*22, outputs=inputs)
     age = gr.Number(label="Age", precision=0, minimum=0)
     height = gr.Number(label="Height(cm)", precision=0, minimum=0)
     weight = gr.Number(label="Weight(kg)", precision=0, minimum=0)

     '''
     Predict the label for the input data
     '''
     # Create a dictionary with input data and dataset var names
     input_data = {
         "dental caries": dental_caries
     }
+    # Convert to DataFrame
     input_df = pd.DataFrame(input_data, index=[0])
     #predict
     label = MODEL.predict(input_df)
     return label
     Configure Gradio interface
     '''
     #set blocks
     info_page = gr.Blocks()
     with info_page:
         # set title and description
         """
         )
     age = gr.Number(label="Age", precision=0, minimum=0)
     height = gr.Number(label="Height(cm)", precision=0, minimum=0)
     weight = gr.Number(label="Weight(kg)", precision=0, minimum=0)

model.py CHANGED Viewed

@@ -9,6 +9,14 @@ from sklearn.neighbors import KNeighborsClassifier
 from sklearn.svm import SVC
 class SmokerModel:
     def __init__(self, model_path, scaler_path):
         self.model = load(model_path)
         self.scaler = load(scaler_path)
@@ -31,7 +39,7 @@ class SmokerModel:
         return new_data_scaled
-    def predict(self, X: np.ndarray) -> str: #TODO: change type to pd df
         """
         Make a prediction on one sample using the loaded model.
@@ -47,22 +55,10 @@ class SmokerModel:
         # scale the data
         X_scaled = self.scale(X)
-        # Check if the array is 1-dimensional aka one sample
-        # if len(X_scaled.shape) != 1:
-        #     raise ValueError("Input array must be one-dimensional (one sample), but got a shape of {}".format(X.shape))
-        #     return
         #check array only has one sample
         if X.shape[0] != 1:
             raise ValueError("Input array must contain only one sample, but {} samples were found".format(X.shape[0]))
             return
-        # Reshape the array
-        # X = X.reshape(1, -1)
-        # X_scaled = X_scaled.reshape(1, -1)
-        # # scale the data
-        # X_scaled = self.scale(X)
         # Now, use the scaled data to make predictions using the loaded model
         array = self.model.predict(X_scaled)

 from sklearn.svm import SVC
 class SmokerModel:
+    """
+    Smoker Model Class that can predict new instances
+    INPUTS
+    ---
+    model_path: the path to the model file
+    scaler_path: the path to the min max scaler file
+    """
     def __init__(self, model_path, scaler_path):
         self.model = load(model_path)
         self.scaler = load(scaler_path)
         return new_data_scaled
+    def predict(self, X: pd.DataFrame) -> str:
         """
         Make a prediction on one sample using the loaded model.
         # scale the data
         X_scaled = self.scale(X)
         #check array only has one sample
         if X.shape[0] != 1:
             raise ValueError("Input array must contain only one sample, but {} samples were found".format(X.shape[0]))
             return
         # Now, use the scaled data to make predictions using the loaded model
         array = self.model.predict(X_scaled)