Spaces:

quantumbit
/

mnist-classifier-api

Sleeping

App Files Files Community

quantumbit committed on Mar 30

Commit

7e18445

verified ·

1 Parent(s): 06aff79

Upload 7 files

Browse files

Files changed (7) hide show

Dockerfile +10 -0
app.py +232 -0
models/mnist_cnn_model.h5 +3 -0
models/mnist_logistic_regression.pkl +3 -0
models/mnist_random_forest.pkl +3 -0
models/mnist_svm.pkl +3 -0
requirements.txt +0 -0

Dockerfile ADDED Viewed

	@@ -0,0 +1,10 @@

+FROM python:3.10-slim
+# Hugging Face Docker Spaces run the container as UID 1000. Create that user
+# and give it ownership of /app; otherwise app.py cannot create its "images"
+# directory at startup.
+RUN useradd -m -u 1000 user \
+    && mkdir -p /app \
+    && chown user:user /app
+USER user
+# pip installs console scripts (e.g. gunicorn) into the user's local bin directory.
+ENV PATH="/home/user/.local/bin:$PATH"
+WORKDIR /app
+# Copy requirements first so the dependency layer is cached across code changes.
+COPY --chown=user:user requirements.txt .
+RUN pip install --no-cache-dir -r requirements.txt
+COPY --chown=user:user . .
+# Serve the Flask object `app` from app.py on port 7860.
+CMD ["gunicorn", "--bind", "0.0.0.0:7860", "app:app"]

app.py ADDED Viewed

	@@ -0,0 +1,232 @@

+from flask import Flask, request, jsonify
+import numpy as np
+import tensorflow as tf
+from PIL import Image
+import io
+import base64
+import re
+import joblib
+import os
+app = Flask(__name__)
+# Directory where /predict stores the most recently received image.
+IMAGE_DIR = "images"
+# exist_ok avoids the check-then-create race when several workers start at once.
+os.makedirs(IMAGE_DIR, exist_ok=True)
+# Resolve the models directory relative to this file, not the process's
+# working directory, so the path is absolute wherever the app is launched from.
+MODEL_DIR = os.path.join(os.path.dirname(os.path.abspath(__file__)), "models")
+# All models are loaded once at import time and shared by every request.
+# NOTE(security): joblib.load unpickles its input and can execute arbitrary
+# code; only load model files that ship with this repository.
+models = {
+    "cnn": tf.keras.models.load_model(os.path.join(MODEL_DIR, "mnist_cnn_model.h5")),
+    "svm": joblib.load(os.path.join(MODEL_DIR, "mnist_svm.pkl")),
+    "logistic": joblib.load(os.path.join(MODEL_DIR, "mnist_logistic_regression.pkl")),
+    "random_forest": joblib.load(os.path.join(MODEL_DIR, "mnist_random_forest.pkl"))
+}
+# Static classification reports and the image preprocessing helper follow;
+# create_simulated_scores is defined further down, after the routes.
+# Pre-computed classification reports (precision / recall / f1-score / support
+# per digit), stored as fixed text and returned verbatim by
+# /get_classification_report. The keys match the keys of `models`.
+# NOTE(review): the "cnn" report's support totals 10000 while the other three
+# total 14000, so they appear to come from different evaluation splits - confirm.
+classification_reports = {
+    "cnn": """
+               precision    recall  f1-score   support
+           0       0.99      1.00      0.99       980
+           1       1.00      1.00      1.00      1135
+           2       0.99      0.99      0.99      1032
+           3       0.99      1.00      0.99      1010
+           4       1.00      0.99      0.99       982
+           5       0.98      0.99      0.99       892
+           6       1.00      0.98      0.99       958
+           7       0.99      0.99      0.99      1028
+           8       1.00      0.99      0.99       974
+           9       0.99      0.99      0.99      1009
+    accuracy                           0.99     10000
+   macro avg       0.99      0.99      0.99     10000
+weighted avg       0.99      0.99      0.99     10000
+    """,
+    "svm": """
+               precision    recall  f1-score   support
+           0     0.9874    0.9896    0.9885      1343
+           1     0.9882    0.9925    0.9903      1600
+           2     0.9706    0.9819    0.9762      1380
+           3     0.9783    0.9749    0.9766      1433
+           4     0.9777    0.9822    0.9800      1295
+           5     0.9827    0.9796    0.9811      1273
+           6     0.9858    0.9921    0.9889      1396
+           7     0.9768    0.9807    0.9788      1503
+           8     0.9813    0.9683    0.9748      1357
+           9     0.9807    0.9669    0.9738      1420
+    accuracy                         0.9810     14000
+   macro avg     0.9809    0.9809    0.9809     14000
+weighted avg     0.9810    0.9810    0.9810     14000
+    """,
+    "random_forest": """
+               precision    recall  f1-score   support
+           0     0.9844    0.9866    0.9855      1343
+           1     0.9831    0.9831    0.9831      1600
+           2     0.9522    0.9674    0.9597      1380
+           3     0.9579    0.9532    0.9556      1433
+           4     0.9617    0.9699    0.9658      1295
+           5     0.9707    0.9631    0.9669      1273
+           6     0.9800    0.9828    0.9814      1396
+           7     0.9668    0.9681    0.9674      1503
+           8     0.9599    0.9528    0.9564      1357
+           9     0.9566    0.9465    0.9515      1420
+    accuracy                         0.9675     14000
+   macro avg     0.9673    0.9674    0.9673     14000
+weighted avg     0.9675    0.9675    0.9675     14000
+    """,
+    "logistic": """
+               precision    recall  f1-score   support
+           0     0.9636    0.9650    0.9643      1343
+           1     0.9433    0.9675    0.9553      1600
+           2     0.9113    0.8935    0.9023      1380
+           3     0.9021    0.8939    0.8980      1433
+           4     0.9225    0.9290    0.9257      1295
+           5     0.8846    0.8790    0.8818      1273
+           6     0.9420    0.9534    0.9477      1396
+           7     0.9273    0.9421    0.9347      1503
+           8     0.8973    0.8696    0.8832      1357
+           9     0.9019    0.9000    0.9010      1420
+    accuracy                         0.9204     14000
+   macro avg     0.9196    0.9193    0.9194     14000
+weighted avg     0.9201    0.9204    0.9202     14000
+    """
+}
+# Turn an uploaded image into the input array a given model type expects.
+def preprocess_image(image, model_type):
+    """Resize to 28x28, convert to grayscale and scale pixel values by 1/255.
+
+    Returns an array of shape (1, 28, 28, 1) when ``model_type`` is "cnn",
+    and a flattened array of shape (1, 784) for every other model type.
+    """
+    grayscale = image.resize((28, 28)).convert('L')
+    pixels = np.array(grayscale) / 255.0
+    if model_type != "cnn":
+        # Non-CNN models take one flat feature row per sample.
+        return pixels.reshape(1, -1)
+    # The CNN takes a batch axis in front and a channel axis at the end.
+    return pixels[np.newaxis, ..., np.newaxis]
+@app.route('/')
+def home():
+    """Describe the service: its name, the loaded model keys and the endpoints."""
+    endpoint_help = {
+        "/predict": "POST - Send image and model_type",
+        "/get_classification_report": "POST - Get model metrics"
+    }
+    service_info = {
+        "message": "MNIST Classifier API",
+        "available_models": [name for name in models],
+        "endpoints": endpoint_help
+    }
+    return jsonify(service_info)
+# API routes: /get_classification_report and /predict.
+@app.route('/get_classification_report', methods=['POST'])
+def get_classification_report():
+    """Return the stored classification report for the requested model.
+
+    Expects a JSON object body with a ``model_type`` key. Responds with
+    ``{"report": <text>}`` when a report is stored for that model, with
+    ``{"error": "Model not found"}`` when none is, and with HTTP 400 when the
+    body is not a JSON object containing ``model_type``.
+    """
+    # silent=True yields None instead of raising on a missing or invalid JSON body.
+    payload = request.get_json(silent=True)
+    if not isinstance(payload, dict) or 'model_type' not in payload:
+        return jsonify({'error': "Request body must be JSON with a 'model_type' field"}), 400
+    model_type = payload['model_type']
+    # Non-string values (e.g. a list) are unhashable and would make the dict
+    # lookup raise, so they are treated as an unknown model.
+    if isinstance(model_type, str) and model_type in classification_reports:
+        return jsonify({
+            'report': classification_reports[model_type]
+        })
+    # Response body and status are kept as before so existing clients keep working.
+    return jsonify({'error': 'Model not found'})
+def _svm_confidence_scores(model, features, predicted_digit, n_classes=10):
+    """Return ``(scores, score_type)`` with one score per class for an SVM.
+
+    Uses ``model.decision_function`` when it is available. An output with
+    ``n_classes`` columns is used directly. An output with one column per
+    class pair (one-vs-one) is reduced to a vote count per class. Any other
+    shape, or a missing/unsupported decision function, falls back to
+    simulated scores.
+    """
+    decision_function = getattr(model, "decision_function", None)
+    if not callable(decision_function):
+        return create_simulated_scores(predicted_digit), "simulated"
+    try:
+        raw_scores = np.asarray(decision_function(features))
+    except (AttributeError, NotImplementedError) as e:
+        app.logger.warning("Error getting decision function: %s", e)
+        return create_simulated_scores(predicted_digit), "simulated"
+    # Only one sample is ever sent, so take the first row.
+    row = np.atleast_2d(raw_scores)[0]
+    if row.size == n_classes:
+        scores = [float(value) for value in row]
+    elif row.size == n_classes * (n_classes - 1) // 2:
+        # One-vs-one: columns are ordered (0,1), (0,2), ..., (8,9) and a
+        # positive value favours the first class of the pair.
+        pairs = [(i, j) for i in range(n_classes) for j in range(i + 1, n_classes)]
+        scores = [0.0] * n_classes
+        for (first, second), margin in zip(pairs, row):
+            scores[first if margin > 0 else second] += 1.0
+    else:
+        return create_simulated_scores(predicted_digit), "simulated"
+    # Shift so the smallest score is zero; the client visualizes non-negative values.
+    lowest = min(scores)
+    if lowest < 0:
+        scores = [score - lowest for score in scores]
+    # The label is kept for both shapes so clients see the same score_type as before.
+    return scores, "decision_distance"
+def _probability_scores(model, features, predicted_digit):
+    """Return ``(scores, score_type)`` from ``predict_proba``, or simulated scores."""
+    predict_proba = getattr(model, "predict_proba", None)
+    if callable(predict_proba):
+        try:
+            return predict_proba(features)[0].tolist(), "probability"
+        except (AttributeError, NotImplementedError):
+            pass
+    return create_simulated_scores(predicted_digit), "simulated"
+@app.route('/predict', methods=['POST'])
+def predict():
+    """Classify a base64-encoded digit image with the requested model.
+
+    Expects a JSON object with ``image`` (base64 text, optionally prefixed by
+    a ``data:image/...;base64,`` header) and ``model_type`` (a key of
+    ``models``). Responds with the predicted ``digit``, a list of
+    ``confidence_scores`` and the ``score_type`` describing those scores.
+    Malformed bodies and undecodable images get HTTP 400; an unknown model
+    gets ``{"error": "Model not found"}``.
+    """
+    payload = request.get_json(silent=True)
+    if not isinstance(payload, dict) or 'image' not in payload or 'model_type' not in payload:
+        return jsonify({'error': "Request body must be JSON with 'image' and 'model_type' fields"}), 400
+    model_type = payload['model_type']
+    # Validate the model before decoding, saving or preprocessing anything.
+    if not isinstance(model_type, str) or model_type not in models:
+        return jsonify({'error': 'Model not found'})
+    data = payload['image']
+    if not isinstance(data, str):
+        return jsonify({'error': 'Invalid image data'}), 400
+    # Accept any image data-URL header, not only PNG.
+    img_data = re.sub(r'^data:image/[^;]+;base64,', '', data)
+    try:
+        img = Image.open(io.BytesIO(base64.b64decode(img_data)))
+        # Force a full decode here so truncated files fail inside this try block.
+        img.load()
+    except (ValueError, OSError):
+        # Invalid base64 raises a ValueError subclass; unreadable images an OSError.
+        return jsonify({'error': 'Invalid image data'}), 400
+    # Keep a copy of the last received image. A failed write (read-only disk,
+    # unsupported mode) must not fail the prediction, so it is only logged.
+    try:
+        img.save(os.path.join(IMAGE_DIR, "digit.png"))
+    except (OSError, ValueError) as e:
+        app.logger.warning("Could not save received image: %s", e)
+    processed_image = preprocess_image(img, model_type)
+    model = models[model_type]
+    if model_type == "cnn":
+        # The CNN output row is used directly as per-class probabilities.
+        prediction = model.predict(processed_image)
+        predicted_digit = int(np.argmax(prediction))
+        confidence_scores = prediction[0].tolist()
+        score_type = "probability"
+    else:
+        predicted_digit = int(model.predict(processed_image)[0])
+        if model_type == "svm":
+            confidence_scores, score_type = _svm_confidence_scores(
+                model, processed_image, predicted_digit)
+        else:
+            # Random Forest and Logistic Regression
+            confidence_scores, score_type = _probability_scores(
+                model, processed_image, predicted_digit)
+    return jsonify({
+        'digit': predicted_digit,
+        'confidence_scores': confidence_scores,
+        'score_type': score_type
+    })
+def create_simulated_scores(predicted_digit, *, n_classes=10, base_score=0.01):
+    """Build placeholder confidence scores that peak at the predicted digit.
+
+    Every class receives ``base_score``; the remainder of the probability
+    mass (1.0 minus the sum of the base scores) is added to
+    ``predicted_digit`` so the list sums to approximately 1.0.
+
+    Args:
+        predicted_digit: Index of the class that receives the extra mass.
+        n_classes: Number of classes in the returned list.
+        base_score: Score given to every class before the remainder is added.
+
+    Returns:
+        A list of ``n_classes`` floats.
+
+    Raises:
+        IndexError: If ``predicted_digit`` is not in ``range(n_classes)``.
+    """
+    # Reject negative indexes explicitly: list indexing would silently wrap
+    # them around and credit the wrong class.
+    if not 0 <= predicted_digit < n_classes:
+        raise IndexError(
+            f"predicted_digit {predicted_digit} is outside 0..{n_classes - 1}")
+    scores = [base_score] * n_classes
+    remaining = 1.0 - sum(scores)
+    scores[predicted_digit] += remaining
+    return scores
+# Runs only when the file is executed directly (e.g. `python app.py`); the
+# Dockerfile in this commit starts the app through gunicorn on the same port.
+if __name__ == '__main__':
+    app.run(host='0.0.0.0', port=7860)  # Hugging Face uses port 7860

models/mnist_cnn_model.h5 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:4f31254d7c3f1c601d4f9e9dac7412af3a4121207e861d046b271e52628c3c41
+size 782992

models/mnist_logistic_regression.pkl ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:49a1943a9c672caace5d1af724f439b1176bb04cebec1df27fed35dca6e10054
+size 63639

models/mnist_random_forest.pkl ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:7bd2a6d25c6a2c3869951fde30cc8687407dae809310aa52ec8b632c100885b1
+size 101529065

models/mnist_svm.pkl ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:35038ec8695cb4d2364138f19d2f6d1709818f4bea9491b3811b89035ae3bc9f
+size 66700155

requirements.txt ADDED Viewed

Binary file (7.54 kB). View file