Digits-Classification-Project/app.py at main · xdnhatnguyen/Digits-Classification-Project · GitHub

1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
import gradio as gr
import torch
import torch.nn.functional as F
import numpy as np
import cv2

# FIX 1: Import your actual model class
from src.model import MLP, CNN

# LOAD MODEL
DEVICE = torch.device("cuda" if torch.cuda.is_available() else "cpu")
# Ensure this path matches exactly where main.py saved it
MODEL_PATHS = ["model/mnist_MLP.pt","model/mnist_CNN.pt"]
models = [MLP().to(DEVICE), CNN().to(DEVICE)]

def load_pytorch_model_from_file(idx):
    try:

        # FIX 3: Uncomment this to actually load the trained weights!
        # If you leave this commented out, you are predicting with a random, empty model.
        models[idx].load_state_dict(torch.load(MODEL_PATHS[idx], map_location=DEVICE))

        models[idx].eval()
        print(f"✅ Successfully loaded model from {MODEL_PATHS[idx]}")
        return models[idx]
    except Exception as e:
        print(f"⚠️ Error loading model: {e}")
        return None

# --- LOGIC XỬ LÝ BIẾN MODEL ---
models = [load_pytorch_model_from_file(idx) for idx in range(2)]

# ==========================================
# HÀM XỬ LÝ ẢNH & DỰ ĐOÁN
# ==========================================
def predict_digit(image, model_name):

    idx = 0
    if model_name == "CNN Model":
        idx = 1
    else:
        idx = 0

    # Handle Gradio 4.x dictionary input
    if isinstance(image, dict):
        image = image['composite']

    if image is None:
        return None

    # 1. Preprocessing
    if image.ndim == 3:
        if image.shape[-1] == 4:
            image = cv2.cvtColor(image, cv2.COLOR_RGBA2GRAY)
        elif image.shape[-1] == 3:
            image = cv2.cvtColor(image, cv2.COLOR_RGB2GRAY)

    image = cv2.resize(image, (28, 28))

    # Invert colors if needed (black background logic)
    if np.mean(image) > 127:
        image = 255 - image

    image = image.astype('float32') / 255.0
    image_tensor = torch.from_numpy(image).float()
    image_tensor = image_tensor.unsqueeze(0).unsqueeze(0)
    image_tensor = image_tensor.to(DEVICE)

    # 2. Inference
    if models[idx]:
        with torch.no_grad():
            output = models[idx](image_tensor)
            probabilities = F.softmax(output, dim=1)
            prob_arr = probabilities.cpu().numpy()[0]

        return {str(i): float(prob_arr[i]) for i in range(10)}
    else:
        return {"Error": 0.0}

# ==========================================
# GIAO DIỆN GRADIO
# ==========================================
demo = gr.Interface(
    fn=predict_digit,
    inputs=[gr.Sketchpad(label="Draw a digit"), gr.Radio(["MLP Model", "CNN Model"], label="Choose model")],
    outputs=gr.Label(num_top_classes=3, label="Prediction"),
    title="HCMUS-ConChoCaoBangBoPC: The World's number one AI Digit Recognizer",
    live=True
)

if __name__ == "__main__":
    demo.launch(share=True)