Spaces:

nssharmaofficial
/

RedEyeClassifier

Sleeping

App Files Files Community

nssharmaofficial committed on May 19, 2024

Commit

3bdf51a

1 Parent(s): 702d527

Add source code and saved weights

Browse files

Files changed (3) hide show

source/model.py +101 -0
source/predict_sample.py +52 -0
source/weights/CNN-B8-LR-0.01-E30.pt +3 -0

source/model.py ADDED Viewed

	@@ -0,0 +1,101 @@

+import torch.nn as nn
+import torch.nn.functional as F
+from dataset import get_paths, get_data_loader, Dataset
+from setup import Setup
+class CNN(nn.Module):
+    """
+    Convolutional Neural Network (CNN) for classifying 'normal' and 'red' eye images.
+    The network consists of four convolutional blocks followed by two fully connected layers.
+    Each convolution is followed by batch normalization and a LeakyReLU(0.2) activation.
+    Every convolution uses kernel size 4, stride 2 and padding 1, so each block halves the
+    spatial size: a 32x32 input reaches fc1 as a 64 x 2 x 2 feature map, which is why fc1
+    expects 64 * 2 * 2 input features.
+    A dropout layer is applied between fc1 and fc2 to reduce overfitting.
+    Attributes:
+        conv1 (nn.Sequential): First convolutional block (3 -> 8 channels).
+        conv2 (nn.Sequential): Second convolutional block (8 -> 16 channels).
+        conv3 (nn.Sequential): Third convolutional block (16 -> 32 channels).
+        conv4 (nn.Sequential): Fourth convolutional block (32 -> 64 channels).
+        fc1 (nn.Linear): First fully connected layer (256 -> 32 features).
+        fc2 (nn.Linear): Second fully connected layer (output layer, 32 -> 2).
+        dropout (nn.Dropout): Dropout layer with a probability of 0.5.
+    """
+    # NOTE(review): the attribute names and the order of layers inside each
+    # nn.Sequential define the state_dict keys; presumably the saved checkpoint
+    # relies on them, so keep them unchanged when editing this class.
+    def __init__(self):
+        super(CNN, self).__init__()
+        self.conv1 = nn.Sequential(
+            nn.Conv2d(3, 8, 4, stride=2, padding=1),
+            nn.BatchNorm2d(8),
+            nn.LeakyReLU(0.2, inplace=True)
+        )
+        self.conv2 = nn.Sequential(
+            nn.Conv2d(8, 16, 4, stride=2, padding=1),
+            nn.BatchNorm2d(16),
+            nn.LeakyReLU(0.2, inplace=True)
+        )
+        self.conv3 = nn.Sequential(
+            nn.Conv2d(16, 32, 4, stride=2, padding=1),
+            nn.BatchNorm2d(32),
+            nn.LeakyReLU(0.2, inplace=True)
+        )
+        self.conv4 = nn.Sequential(
+            nn.Conv2d(32, 64, 4, stride=2, padding=1),
+            nn.BatchNorm2d(64),
+            nn.LeakyReLU(0.2, inplace=True)
+        )
+        # 64 channels x 2 x 2 spatial positions remain after conv4 for a 32x32 input.
+        self.fc1 = nn.Linear(64 * 2 * 2, 32)
+        self.fc2 = nn.Linear(32, 2)
+        self.dropout = nn.Dropout(0.5)
+    def forward(self, x):
+        """
+        Defines the forward pass of the CNN.
+        Args:
+            x (torch.Tensor): Input tensor of shape (batch_size, 3, 32, 32).
+        Returns:
+            torch.Tensor: Log-probabilities (log-softmax over the class dimension)
+                of shape (batch_size, 2).
+        """
+        # Shapes below are for a (batch, 3, 32, 32) input.
+        x = self.conv1(x)
+        # -> (batch, 8, 16, 16)
+        x = self.conv2(x)
+        # -> (batch, 16, 8, 8)
+        x = self.conv3(x)
+        # -> (batch, 32, 4, 4)
+        x = self.conv4(x)
+        # -> (batch, 64, 2, 2)
+        # Flatten everything except the batch dimension: (batch, 256).
+        x = x.view(x.size(0), -1)
+        x = F.leaky_relu(self.fc1(x))
+        x = self.dropout(x)
+        x = self.fc2(x)
+        # -> (batch, 2) raw class scores, normalised to log-probabilities below.
+        return F.log_softmax(x, dim=1)
+if __name__ == '__main__':
+    """
+    Main script to initialize the setup, load datasets, create DataLoader,
+    instantiate the CNN model, and display the number of trainable parameters
+    and the output size for a batch of images.
+    """
+    setup = Setup()
+    normal_train_paths, red_train_paths, normal_test_paths, red_test_paths = get_paths()
+    train_dataset = Dataset(red_train_paths, normal_train_paths)
+    train_loader = get_data_loader(train_dataset, batch_size=setup.BATCH)
+    imgs, labels = next(iter(train_loader))
+    cnn = CNN()
+    print(f'Number of trainable parameters in CNN: {sum(p.numel() for p in cnn.parameters() if p.requires_grad)}')
+    output = cnn.forward(imgs)
+    # Print info
+    print('\nBatch size: ', setup.BATCH)
+    print('Images size: ', imgs.size())         # (batch, 3, 32, 32)
+    print('CNN output size: ', output.size())   # (batch, 2)

source/predict_sample.py ADDED Viewed

	@@ -0,0 +1,52 @@

+from torchvision import transforms
+import torch
+import torch.utils.data
+from PIL import Image
+from source.model import CNN
+def classify_eye(image: torch.Tensor,
+                 model: CNN) -> str:
+    """
+    Generate caption of a single image of size (3, 224, 224).
+    Generating of caption starts with <sos>, and each next predicted word ID
+    is appended for the next LSTM input until the sentence reaches MAX_LENGTH or <eos>.
+    Returns:
+        list[str]: caption for given image
+    """
+    # image: (3, 32, 32)
+    image = image.unsqueeze(0)
+    # image: (1, 3, 32, 32)
+    output = model.forward(image)
+    _, prediction = torch.max(output, dim=1)
+    if prediction == 0:
+        output = 'Normal'
+    elif prediction == 1:
+        output = 'Red'
+    return output
+def main_classification(image):
+    image = Image.fromarray(image.astype('uint8'), 'RGB')
+    transform = transforms.Compose([
+        transforms.Resize((32, 32)),
+        transforms.ToTensor(),
+        transforms.Normalize(mean=[0.5, 0.5, 0.5], std=[0.5, 0.5, 0.5])
+        ])
+    image = transform(image)
+    image = image.to(torch.device("cpu"))
+    cnn = CNN().to(torch.device("cpu"))
+    cnn.eval()
+    cnn.load_state_dict(torch.load(f='weights/CNN-B8-LR-0.01-E30.pt', map_location=torch.device("cpu")))
+    prediction_outcome = classify_eye(image, cnn)
+    return prediction_outcome

source/weights/CNN-B8-LR-0.01-E30.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:f9fb3f4e01f9420578b5e55c4975a5a5b3574e1b54d15d448ca9120a244eba9f
+size 219842