alinJain
/

DriverPredictionFinal

Model card Files Files and versions Community

alinJain commited on Dec 23, 2024

Commit

bb1009c

verified ·

1 Parent(s): dfb7845

Upload driverpospredictionfinal.py

Browse files

Files changed (1) hide show

driverpospredictionfinal.py +239 -0

driverpospredictionfinal.py ADDED Viewed

	@@ -0,0 +1,239 @@

+# -*- coding: utf-8 -*-
+"""DriverPosPredictionFinal
+Automatically generated by Colab.
+Original file is located at
+    https://colab.research.google.com/drive/1DGTfO4HEZDof1phuficJD_J8v38JnF3C
+"""
+from sklearn import tree, linear_model
+from sklearn.tree import DecisionTreeClassifier, DecisionTreeRegressor
+from sklearn.model_selection import train_test_split, GridSearchCV
+!pip install bayesian-optimization
+from bayes_opt import BayesianOptimization
+from sklearn.metrics import mean_squared_error, mean_absolute_error, r2_score, mean_squared_log_error, median_absolute_error
+import pandas as pd
+import joblib
+import matplotlib.pyplot as plt
+import seaborn as sns
+import numpy as np
+import xgboost as xgb
+import pickle
+def read_data(file_name):
+  df = pd.read_csv(file_name)
+  x= df.drop(['RaceID', "Pos", "formating" ], axis=1)
+  y =df["Pos"]
+  return x,y
+#returns the object for model being used
+def decision_tree_regressor_method():
+  dtree = DecisionTreeRegressor(random_state=42)
+  return dtree
+def decsison_tree_classifier_method(X_train,y_train):
+  dtree = DecisionTreeClassifier()
+  dtree = dtree.fit(X_train,y_train)
+  return dtree
+def linear_reg(X_train,y_train):
+  regr= linear_model.LinearRegression()
+  regr.fit(X_train,y_train)
+  return regr
+def hyper_paramter_tuning(model, xtrain,ytrain,**kwargs): #doesnt work for linear regression
+  #dtree = DecisionTreeRegressor(random_state=42)
+#  grid_search_object = GridSearchCV(estimator=model, param_grid=kwargs, cv=5, n_jobs=-1, verbose=2, scoring='neg_mean_squared_error')
+  grid_search_object = GridSearchCV(estimator=model, param_grid=kwargs, cv=3, n_jobs=-1, verbose=2, scoring='neg_mean_squared_error')
+  grid_search_object.fit(xtrain,ytrain)
+  best_estimator = grid_search_object.best_estimator_
+  return best_estimator
+def predict(model, xtest,ytest):
+    # Predict the target for the test set
+    y_pred = model.predict(xtest)
+    # Calculate various evaluation metrics
+    mse = mean_squared_error(ytest, y_pred)
+    rmse = mse ** 0.5
+    mae = mean_absolute_error(ytest, y_pred)
+    r2 = r2_score(ytest, y_pred)
+    msle = mean_squared_log_error(ytest, y_pred)
+    medae = median_absolute_error(ytest, y_pred)
+    # Print the metrics
+    print(f"Test MSE: {mse}") # smaller is better - mean squared error
+    print(f"Test RMSE: {rmse}")#
+    print(f"Test MAE: {mae}")
+    print(f"Test R²: {r2}")
+    print(f"Test MSLE: {msle}")
+    print(f"Test Median Absolute Error: {medae}")
+    #rmse measures abg magnitude of errors betwen actual and predicted values
+    return y_pred
+def hyperamter_tuning_paramter_grid():
+  parameter_grid = {'max_depth': [1,2,3,4,5,None],
+     "min_samples_split":[2,3,5,6] ,
+     'min_samples_leaf': [1,2,4,5],
+     "min_weight_fraction_leaf": [0.0,0.01, 0.05,0.1, 0.2],# add more hypermater tuning criteria
+    }#'criterion': ['gini', 'entropy']
+  return parameter_grid
+def ask_user(model, X_test=None):
+    """
+    Collect user input and format it for prediction.
+    Returns a DataFrame with a single row formatted like the training data.
+    """
+    try:
+        # Create a dictionary to store inputs
+        input_data = {}
+        # Collect basic race information
+        input_data['LapNumber'] = float(input("Enter the number of total laps in race: "))
+        input_data['LapTimes'] = float(input("Avg lap time from prev year (or estimate 98): "))
+        input_data['PitStopTimes'] = float(input("Enter pit stop time (0 if no pit stop): "))
+        input_data['PrevLap'] = float(input("Enter avg lap time differece (0-2) (0 if first lap): "))
+        # Collect race conditions
+        input_data['AvgSpeed'] = float(input("Enter average speed in km/h from prev year: "))
+        input_data['AirTemp_Cel'] = float(input("estimate air temperature in Celsius on race day: "))
+        input_data['TrackTemp_Cel'] = float(input("estimate track temperature in Celsius on race day: "))
+        input_data['Humidity'] = float(input("estimate the humidity percentage (0-100) on race day: "))
+        input_data['WindSpeed_km/h'] = float(input("estimate wind speed in km/h: "))
+        # Create a DataFrame with the input data
+        input_df = pd.DataFrame([input_data])
+        # If we have a test set, ensure our columns match the training data
+        if X_test is not None:
+            missing_cols = set(X_test.columns) - set(input_df.columns)
+            # Add any missing columns with 0s
+            for col in missing_cols:
+                input_df[col] = 0
+            # Ensure column order matches training data
+            input_df = input_df[X_test.columns]
+        # Make prediction
+        prediction = model.predict(input_df)
+        print(f"\nPredicted position: {int(round(prediction[0]))}")
+        return prediction[0]
+    except ValueError as e:
+        print(f"Error: Please enter valid numeric values. Details: {e}")
+        return None
+    except Exception as e:
+        print(f"An error occurred: {e}")
+        return None
+#-----linear regresssion------------
+x , y= read_data("b.csv")
+xtrain, xtest , ytrain, ytest = train_test_split(x,y,test_size = 0.3)
+model_1 = linear_reg(xtrain,ytrain)
+ypred = predict(model_1,xtest,ytest)
+#visvualize(ytest,ypred)
+#-----descision tree classifier-----
+x , y= read_data("b.csv")
+xtrain, xtest , ytrain, ytest = train_test_split(x,y,test_size = 0.3)
+model_2 = decsison_tree_classifier_method(xtrain,ytrain)
+parameter_grid= hyperamter_tuning_paramter_grid()
+tuned_model_2 = hyper_paramter_tuning(model_2,xtrain,ytrain,**parameter_grid)
+y_pred = predict(tuned_model_2,xtest,ytest)
+#visvualize(ytest,ypred)
+#----descision tree regressor-------
+x , y= read_data("b.csv")
+xtrain, xtest , ytrain, ytest = train_test_split(x,y,test_size = 0.3)
+model_3 = decision_tree_regressor_method()
+parameter_grid= hyperamter_tuning_paramter_grid()
+tuned_model_3 = hyper_paramter_tuning(model_3,xtrain,ytrain,**parameter_grid)
+y_pred= predict(tuned_model_3,xtest,ytest)
+# Ask user for input and predict position
+#predicted_position = ask_user(tuned_model_3, x_columns)
+predicted_position = ask_user(tuned_model_3, xtest)
+#pickle.dump(tuned_model_3.open('model.pkl','mb'))
+!pip install streamlit
+import streamlit as st
+import pickle
+import numpy as np
+model = pickle.load(open('model.pkl','rb'))
+def predictPos(TLaps,Laptime,Pit,Prev,AvgSpeed,AirTemp,TrackTemp,Humid,Wind):
+  input = np.array([ [TLaps,Laptime,Pit,Prev,AvgSpeed,AirTemp,TrackTemp,Humid,Wind]]).astype(np.float64)
+  prediction=model.predict(input)
+  return prediction[0]
+def main():
+  st.title("title")
+  html_temp="""
+  <div style = "background-color:#025244; padding :10px">
+  <h2 style = "color:white; text-align:center;"> Driver Position Prediction </h2>
+  </div>
+  """
+  st.markdown(html_temp, unsafe_allow_html=True)
+  TLaps = st.text_input("Enter the number of total laps in race: ","Type Here")
+  Laptime = st.text_input("Avg lap time from prev year (or estimate 98): ","Type Here")
+  Pit = st.text_input("Enter pit stop time (0 if no pit stop): ","Type Here")
+  Prev= st.text_input("Enter avg lap time differece (0-2) (0 if first lap): ","Type Here")
+  AvgSpeed = st.text_input("Enter average speed in km/h from prev year: ","Type Here")
+  AirTemp= st.text_input("estimate air temperature in Celsius on race day: ","Type Here")
+  TrackTemp = st.text_input("estimate track temperature in Celsius on race day: ","Type Here")
+  Humid = st.text_input("estimate the humidity percentage (0-100) on race day: ","Type Here")
+  Wind = st.text_input("estimate wind speed in km/h: ","Type Here")
+  safe_html="""
+    <div style="background-color:#F4D03F;padding:10px >
+    <h2 style="color:white;text-align:center;"> Your forest is safe</h2>
+    </div>
+    """
+  danger_html="""
+  <div style="background-color:#F08080;padding:10px >
+    <h2 style="color:black ;text-align:center;"> Your forest is in danger</h2>
+   </div>
+    """
+  if st.button("Predict"):
+    output=predictPos(TLaps,Laptime,Pit,Prev,AvgSpeed,AirTemp,TrackTemp,Humid,Wind)
+    st.success('The postion of driver is {}'.format(output))
+    # if output > 0.5:
+    #   st.markdown(danger_html,unsafe_allow_html=True)
+    # else:
+    #   st.markdown(safe_html,unsafe_allow_html=True)
+if __name__=='__main__':
+    main()