COVID-19 Detection from Chest X-rays Using Transfer Learning¶

Problem Statement¶

Rapid detection of COVID-19 cases is critical to containing the virus and to easing pressure on an overloaded healthcare system. Clinical testing for COVID-19 is lengthy, so imaging tools such as chest X-rays are a key instrument for helping detect COVID-19 and speeding up the identification process. In this notebook, we train a deep convolutional neural network using transfer learning on a novel dataset of 15,000 chest X-rays to aid in the detection of COVID-19. Further, we implement Local Interpretable Model-Agnostic Explanations (LIME) to provide insight into the model's predictions, enabling healthcare providers to make diagnoses that are both time-efficient and correct.

In [8]:
'''Load PyTorch and necessary libraries.'''

import torch
import torch.nn as nn
from torch.utils.data import DataLoader
import torch.nn.functional as F

import torchvision
import torchvision.datasets as datasets
from torchvision import models
import torchvision.transforms as transforms

import os
from pathlib import Path
import Augmentor
from IPython.display import display  # Only display is needed; PIL's Image (imported below) handles image loading
import splitfolders
import matplotlib.pyplot as plt
import numpy as np
import time
from sklearn.metrics import f1_score, precision_score, recall_score, classification_report
import seaborn as sns
import pandas as pd
from PIL import Image
dir = os.getcwd()

Data Collection and Augmentation¶

We use chest X-ray images from three categories: normal, pneumonia, and COVID-19 cases. The dataset, containing 5,000 normal images, 5,000 pneumonia images, and 4,420 COVID-19 images, was collected from eleven different publicly available datasets by Badawi et al. [1] Using data augmentation with the Augmentor package, we generate an additional 580 COVID-19 images to construct a more balanced dataset.

In [84]:
dir = os.getcwd()
p = Augmentor.Pipeline(os.path.join(dir, 'preXrayData/covid'))
p.rotate(probability=0.7, max_left_rotation=10, max_right_rotation=10) # Rotate 70% of the images between 10 and -10 degrees
p.random_distortion(probability=1, grid_width=4, grid_height=4, magnitude=8) # Randomly distort the images while maintaining their aspect ratio
p.flip_left_right(probability=1) # Mirror the images from left to right
p.process()
p.sample(580)
Initialised with 4999 image(s) found.
Processing <PIL.Image.Image image mode=L size=3050x2539 at 0x7F103893BF40>: 100%|██████████| 4999/4999 [06:11<00:00, 13.46 Samples/s]   
Processing <PIL.Image.Image image mode=L size=299x299 at 0x7F0FFC56D810>: 100%|██████████| 580/580 [00:49<00:00, 11.61 Samples/s]     
In [146]:
'''Visualize augmented image.'''

aug_img_path = 'preXrayData/covid/covid_original_COVID-597.png_b8c0f5bb-77e0-4749-9359-d746af324bcb.png'
display(Image.open(aug_img_path))
[Output image: an augmented COVID-19 chest X-ray]
In [87]:
'''Move additional generated images into correct folder.'''

src_path = os.path.join(dir, 'preXrayData/covid/output')
for each_file in Path(src_path).glob('*.*'): # grabs all files
    tar_path = each_file.parent.parent
    each_file.rename(tar_path.joinpath(each_file.name))
os.rmdir(src_path) # Remove the now-empty output directory (os.remove fails on directories)
In [94]:
'''Split the training and validation data.'''

data = os.path.join(dir, 'preXrayData')
splitfolders.ratio(data, output='postXrayData', seed=1337, ratio=(0.8,0.2))
Copying files: 20578 files [00:10, 1920.93 files/s]

The Model¶

InceptionV3 is an image recognition model that has been pre-trained on the ImageNet dataset, attaining greater than 78.1% accuracy. It is based on the paper Rethinking the Inception Architecture for Computer Vision by Szegedy et al. [2], which argues that although increased model size and computational cost tend to translate into immediate quality gains for most tasks (as long as enough labeled data is provided for training), computational efficiency and a low parameter count are still valuable enabling factors. InceptionV3 therefore focused on scaling up previous Inception iterations as efficiently as possible, using suitably factorized convolutions and aggressive regularization.
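To make "suitably factorized convolutions" concrete, the short sketch below (our illustration, not code from the paper) compares the parameter count of a single 5x5 convolution against the stack of two 3x3 convolutions that covers the same receptive field; the channel sizes are arbitrary.

import torch.nn as nn

in_ch, out_ch = 64, 64

# A single 5x5 convolution
conv5 = nn.Conv2d(in_ch, out_ch, kernel_size=5, padding=2)

# Two stacked 3x3 convolutions: same 5x5 receptive field, fewer parameters
conv3x2 = nn.Sequential(
    nn.Conv2d(in_ch, out_ch, kernel_size=3, padding=1),
    nn.Conv2d(out_ch, out_ch, kernel_size=3, padding=1),
)

count = lambda m: sum(p.numel() for p in m.parameters())
print(count(conv5), count(conv3x2))  # 102464 vs. 73856, roughly 28% fewer parameters

InceptionV3 pushes the same idea further by splitting an n x n convolution into a 1 x n convolution followed by an n x 1 convolution.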

Why InceptionV3?¶
[Figure: motivation for choosing InceptionV3]
Why Transfer Learning?¶

Transfer learning is a method to overcome insufficient data and/or training resources by adding a head, or final layer, to a pre-trained network (replacing the original classifier). This involves taking a pre-trained model, keeping its layers as a feature extractor, and feeding their output into a series of dense layers. A dense layer is a simple layer of neurons in which each neuron receives input from all the neurons of the previous layer, thus capturing complex patterns.
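As a minimal illustration of that connectivity (toy sizes, not this notebook's model), nn.Linear connects every input neuron to every output neuron:

import torch
import torch.nn as nn

dense = nn.Linear(in_features=4, out_features=2)  # Weight matrix of shape (2, 4): each output sees all 4 inputs
x = torch.randn(1, 4)
y = dense(x)     # Computes y = x @ W.T + b
print(y.shape)   # torch.Size([1, 2])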

Model Architecture¶
[Figure: model architecture (InceptionV3 backbone with custom dense head)]
In [6]:
'''Image transformation and normalization so the input data matches the model's expectations.'''

train_pathname = os.path.join(dir, 'postXrayData/train') # Contains 80% of the data
val_pathname = os.path.join(dir, 'postXrayData/val')     # Contains 20% of the data

# Transform pipeline to ensure input data is prepared in the same way as the original training data for the model
train_transform = transforms.Compose([
        transforms.RandomResizedCrop(299),
        transforms.RandomHorizontalFlip(),
        transforms.ToTensor(),
        transforms.Normalize((0.5,), (0.5,))  # X-rays are greyscale, so one mean/std (broadcast across the loader's RGB channels)
])
val_transform = transforms.Compose([
        transforms.Resize((299, 299)),
        transforms.ToTensor(),
        transforms.Normalize((0.5,), (0.5,))
])

train_data = datasets.ImageFolder(train_pathname, train_transform)
val_data = datasets.ImageFolder(val_pathname, val_transform)

batch_size = 8 # Mini-batches of 8 samples at a time

# Dataloaders pass the data through the transform pipelines
train_loader = DataLoader(train_data, 
                          batch_size=batch_size, 
                          shuffle=True)
val_loader = DataLoader(val_data, 
                        batch_size=batch_size, 
                        shuffle=True)
In [95]:
'''Display labelled, transformed images.'''

def imshow(img, title):
    img = torchvision.utils.make_grid(img, normalize=True)
    npimg = img.numpy()
    fig = plt.figure(figsize=(10, 30))
    plt.imshow(np.transpose(npimg, (1, 2, 0)))
    plt.title(title)
    plt.axis('off')
    plt.show()

dataiter = iter(train_loader)
images, labels = next(dataiter)

imshow(images, [train_data.classes[i] for i in labels])
[Output image: a labelled batch of transformed training X-rays]
In [9]:
'''Define the model and parameters.'''

model = models.inception_v3(weights=models.Inception_V3_Weights.IMAGENET1K_V1)  # Pre-trained on ImageNet

for param in model.parameters():
    param.requires_grad = False

# Define the custom final layer
model.fc = nn.Sequential(
    nn.Linear(model.fc.in_features, 128),
    nn.ReLU(),
    nn.Linear(128, 64),
    nn.ReLU(),
    nn.Dropout(p=0.5),
    nn.Linear(64, 3),
    nn.Softmax(dim=1)  # dim required; note CrossEntropyLoss applies log-softmax internally, so it receives probabilities here rather than raw logits
)

device = torch.device("cuda:0" if torch.cuda.is_available() else "cpu")
print("Device: " + str(device))
model = model.to(device)

num_epochs = 15     # The number of complete passes through the training dataset
batch_size = 8      # The number of samples processed before the model is updated
learn_rate = 0.001  # Determines the step size while moving toward a min of a loss function
Device: cuda:0
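As a quick sanity check (our addition, not an original cell), we can confirm that freezing the backbone left only the custom head trainable:

trainable = sum(p.numel() for p in model.parameters() if p.requires_grad)
total = sum(p.numel() for p in model.parameters())
print(f'{trainable:,} of {total:,} parameters are trainable')  # Only the fc head contributes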
In [10]:
# Use the cross-entropy loss function to measure loss (the difference between the true and predicted class distributions)
criterion = torch.nn.CrossEntropyLoss()
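As a small check of what the criterion computes (illustrative numbers, not model outputs), the loss is the negative log-probability that the softmax assigns to the true class:

logits = torch.tensor([[2.0, 0.5, 0.1]])  # Raw scores for 3 classes
target = torch.tensor([0])                # Index of the true class

manual = -F.log_softmax(logits, dim=1)[0, target]
print(criterion(logits, target).item(), manual.item())  # Both ~0.3168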
In [11]:
# Adam optimization is used in place of classical stochastic gradient descent to update the network
# weights; it speeds up gradient descent by using exponentially weighted averages of the gradients
optimizer = torch.optim.Adam(model.parameters(), 
                             lr=learn_rate, 
                             weight_decay=learn_rate / num_epochs)
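For intuition about those weighted averages, here is a simplified single-parameter sketch of the Adam update rule (standard hyperparameter names; not code used by this notebook):

def adam_step(theta, grad, m, v, t, lr=0.001, b1=0.9, b2=0.999, eps=1e-8):
    m = b1 * m + (1 - b1) * grad     # Exponentially weighted average of gradients
    v = b2 * v + (1 - b2) * grad**2  # ... and of squared gradients
    m_hat = m / (1 - b1**t)          # Bias correction for zero initialization
    v_hat = v / (1 - b2**t)
    theta -= lr * m_hat / (v_hat**0.5 + eps)
    return theta, m, v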
In [8]:
'''Function to plot the accuracy and loss while training.'''

def plot_accuracy_loss(train_losses, val_losses, train_acc, val_acc, num_epochs):
    sns.set_style('darkgrid')
    sns.set_palette("mako")
    fig, ax = plt.subplots(1, 2, figsize=(10, 5), tight_layout=True)
    data = {'Epochs': list(range(1, num_epochs + 1)), 'Train Loss': train_losses, 'Val Loss': val_losses,
            'Train Accuracy': train_acc, 'Val Accuracy': val_acc}
    df = pd.DataFrame(data)
    
    # Accuracies
    sns.lineplot(data=df, x="Epochs", y="Train Accuracy", color='C1', ax=ax[0])
    sns.lineplot(data=df, x="Epochs", y="Val Accuracy", color='C4', ax=ax[0])
    ax[0].set_ylabel("Accuracy")
    ax[0].set_xlabel("Epoch")
    ax[0].set_xlim(1, num_epochs)
    ax[0].set_xticks(range(1, num_epochs + 1))
    ax[0].legend(labels=["Train Acc", "Val Acc"])

    # Losses
    sns.lineplot(data=df, x="Epochs", y="Train Loss", color='C1', ax=ax[1])
    sns.lineplot(data=df, x="Epochs", y="Val Loss", color='C4', ax=ax[1])
    ax[1].set_ylabel("Loss")
    ax[1].set_xlabel("Epoch")
    ax[1].set_xlim(1, num_epochs)
    ax[1].set_xticks(range(1, num_epochs + 1))
    ax[1].legend(labels=["Train Loss", "Val Loss"])

    fig.suptitle('Inception-v3')
    plt.show()
In [9]:
'''Function to train the model.'''

def train_model(model, criterion, optimizer, num_epochs, train_loader, val_loader,
                device, dataset_sizes, class_names):
    since = time.time()

    train_losses = []
    val_losses = []
    train_acc = []
    val_acc = []

    for epoch in range(num_epochs):
        print('Epoch {}/{}'.format(epoch + 1, num_epochs))
        print('-' * 10)

        for phase in ['train', 'val']:
            if phase == 'train':
                model.train()
                loader = train_loader
            else:
                model.eval()
                loader = val_loader

            running_loss = 0.0
            running_true = 0

            y_true, y_pred = [], []

            # Iterate over the data
            for inputs, labels in loader:
                inputs = inputs.to(device)
                labels = labels.to(device)

                optimizer.zero_grad() # Sets the gradients of all optimized tensors to zero

                # Only track history when training
                with torch.set_grad_enabled(phase == 'train'):
                    if phase == 'train':
                        # Forward pass --> calculating loss from model outputs
                        outputs, aux_outputs = model(inputs)

                        # Inception has an auxiliary output --> while training we calculate loss by summing final & auxiliary output
                        loss1 = criterion(outputs, labels)
                        loss2 = criterion(aux_outputs, labels)
                        loss = loss1 + 0.4 * loss2
                    else:
                        outputs = model(inputs)
                        loss = criterion(outputs, labels)

                    _, preds = torch.max(outputs, 1)
                    y_true.append(labels)
                    y_pred.append(preds)

                    # Backward pass --> updating weights with Adam optimizer
                    if phase == 'train':
                        loss.backward()
                        optimizer.step()

                    # Some stats
                    running_loss += loss.item() * inputs.size(0)
                    running_true += torch.sum(preds == labels.data)

            # More stats
            y_true, y_pred = torch.cat(y_true), torch.cat(y_pred)
            epoch_loss = running_loss / dataset_sizes[phase]
            epoch_acc = running_true.double() / dataset_sizes[phase]
            total_loss = running_loss / y_true.size(0)
            if phase == 'train':
                train_losses.append(epoch_loss)
                train_acc.append(epoch_acc.item())
            if phase == 'val':
                val_losses.append(epoch_loss)
                val_acc.append(epoch_acc.item())

            # Output stats each epoch
            print('{} loss: {:.4f}, {} accuracy: {:.4f}'.format(phase, total_loss, phase, epoch_acc))
            precision = precision_score(y_true.cpu(), y_pred.cpu(), average='macro')
            recall = recall_score(y_true.cpu(), y_pred.cpu(), average='macro')
            print('{} precision: {:.4f}, {} recall: {:.4f}'.format(phase, precision, phase, recall))
            f1 = f1_score(y_true.cpu(), y_pred.cpu(), average='macro')
            print('{} F1 score: {:.4f}'.format(phase, f1))
            print('Support: ')
            print(classification_report(y_true.cpu(), y_pred.cpu(), target_names=class_names))
        print()

    time_elapsed = time.time() - since
    print('Training complete in {:.0f}m {:.0f}s'.format(time_elapsed // 60, time_elapsed % 60))
    print()
    print('Train Lists')
    print(train_losses)
    print(train_acc)
    print('Val Lists')
    print(val_losses)
    print(val_acc)

    # Plot the accuracy and loss
    plot_accuracy_loss(train_losses, val_losses, train_acc, val_acc, num_epochs)

    return model
In [10]:
'''Train the model.'''

dataset_sizes = {'train': len(train_data), 'val': len(val_data)}
class_names = train_data.classes

model = train_model(model, criterion, optimizer, 
                    num_epochs, train_loader, val_loader, 
                    device, dataset_sizes, class_names)
Epoch 1/15
----------

train loss: 4.2332, train accuracy: 0.6474
train precision: 0.6456, train recall: 0.6474
train F1 score: 0.6453
Support: 
              precision    recall  f1-score   support

       covid       0.68      0.75      0.71      3999
      normal       0.63      0.57      0.60      4000
   pneumonia       0.63      0.62      0.62      4000

    accuracy                           0.65     11999
   macro avg       0.65      0.65      0.65     11999
weighted avg       0.65      0.65      0.65     11999

val loss: 0.7320, val accuracy: 0.8187
val precision: 0.8379, val recall: 0.8187
val F1 score: 0.8175
Support: 
              precision    recall  f1-score   support

       covid       0.81      0.95      0.88      1000
      normal       0.72      0.81      0.77      1000
   pneumonia       0.97      0.69      0.81      1000

    accuracy                           0.82      3000
   macro avg       0.84      0.82      0.82      3000
weighted avg       0.84      0.82      0.82      3000

Epoch 5/15
----------


train loss: 4.1726, train accuracy: 0.7157
train precision: 0.7149, train recall: 0.7157
train F1 score: 0.7144
Support: 
              precision    recall  f1-score   support

       covid       0.73      0.80      0.76      3999
      normal       0.70      0.65      0.68      4000
   pneumonia       0.71      0.69      0.70      4000

    accuracy                           0.72     11999
   macro avg       0.71      0.72      0.71     11999
weighted avg       0.71      0.72      0.71     11999

val loss: 0.7137, val accuracy: 0.8373
val precision: 0.8505, val recall: 0.8373
val F1 score: 0.8363
Support: 
              precision    recall  f1-score   support

       covid       0.76      0.97      0.86      1000
      normal       0.84      0.75      0.79      1000
   pneumonia       0.95      0.79      0.86      1000

    accuracy                           0.84      3000
   macro avg       0.85      0.84      0.84      3000
weighted avg       0.85      0.84      0.84      3000




Epoch 10/15
----------
train loss: 4.1572, train accuracy: 0.7371
train precision: 0.7363, train recall: 0.7372
train F1 score: 0.7365
Support: 
              precision    recall  f1-score   support

       covid       0.77      0.80      0.79      3999
      normal       0.71      0.68      0.70      4000
   pneumonia       0.72      0.73      0.73      4000

    accuracy                           0.74     11999
   macro avg       0.74      0.74      0.74     11999
weighted avg       0.74      0.74      0.74     11999

val loss: 0.7836, val accuracy: 0.7620
val precision: 0.8357, val recall: 0.7620
val F1 score: 0.7617
Support: 
              precision    recall  f1-score   support

       covid       0.92      0.80      0.85      1000
      normal       0.60      0.95      0.74      1000
   pneumonia       0.99      0.54      0.70      1000

    accuracy                           0.76      3000
   macro avg       0.84      0.76      0.76      3000
weighted avg       0.84      0.76      0.76      3000




Epoch 15/15
----------
train loss: 4.1443, train accuracy: 0.7475
train precision: 0.7470, train recall: 0.7475
train F1 score: 0.7469
Support: 
              precision    recall  f1-score   support

       covid       0.77      0.81      0.79      3999
      normal       0.72      0.71      0.72      4000
   pneumonia       0.75      0.72      0.73      4000

    accuracy                           0.75     11999
   macro avg       0.75      0.75      0.75     11999
weighted avg       0.75      0.75      0.75     11999

val loss: 0.6864, val accuracy: 0.8590
val precision: 0.8616, val recall: 0.8590
val F1 score: 0.8595
Support: 
              precision    recall  f1-score   support

       covid       0.92      0.84      0.88      1000
      normal       0.80      0.84      0.82      1000
   pneumonia       0.87      0.90      0.88      1000

    accuracy                           0.86      3000
   macro avg       0.86      0.86      0.86      3000
weighted avg       0.86      0.86      0.86      3000


Training complete in 129m 10s

Train Lists
[4.233225082772922, 4.184903535199907, 4.167400298351864, 4.1570234450909265, 4.1726095845912115, 4.1639086500546645, 4.159437492555634, 4.164028998881303, 4.155271156558057, 4.157233690180295, 4.146512436125614, 4.153732038953025, 4.144367789832718, 4.150911634311506, 4.144309521059223]
[0.6473872822735227, 0.7044753729477456, 0.7263105258771564, 0.7295607967330611, 0.7157263105258771, 0.7283940328360696, 0.7318943245270438, 0.7298108175681306, 0.7398116509709142, 0.7371447620635052, 0.7368947412284357, 0.7402283523626968, 0.7461455121260104, 0.739311609300775, 0.747478956579715]


Val Lists
[0.7319899916648864, 0.7481962094306945, 0.7327691181500753, 0.7089627049763998, 0.713724932829539, 0.6956825722058614, 0.6898001863161722, 0.7157928222020468, 0.6971481850941976, 0.7836368376413981, 0.6745693442026774, 0.7573272180557251, 0.7451883797645569, 0.7283474817276001, 0.6863970088958741]
[0.8186666666666667, 0.7986666666666666, 0.8136666666666666, 0.8383333333333333, 0.8373333333333333, 0.852, 0.8583333333333333, 0.8316666666666667, 0.851, 0.762, 0.873, 0.7889999999999999, 0.7999999999999999, 0.8173333333333334, 0.859]


[Output: Inception-v3 training/validation accuracy and loss curves]

Results¶

After training for 15 epochs (2 hours 9 minutes) on an NVIDIA GeForce GTX 1050 Ti GPU, the model achieved the following validation scores (a toy check of these metrics follows the list):

  1. Accuracy (fraction of correct labels): 85.90%
  2. Loss (cross-entropy): 0.6864
  3. Precision (TP / (TP + FP)): 86.16%
  4. Recall (TP / (TP + FN)): 85.90%
  5. F1-Score (harmonic mean of precision & recall): 85.95%
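As a toy check of these definitions (made-up labels, not the model's outputs), sklearn's macro-averaged metrics match the hand formulas:

from sklearn.metrics import precision_score, recall_score, f1_score

y_true = [0, 0, 1, 1, 2, 2]  # 0=covid, 1=normal, 2=pneumonia
y_pred = [0, 1, 1, 1, 2, 0]

print(precision_score(y_true, y_pred, average='macro'))  # Mean over classes of TP / (TP + FP)
print(recall_score(y_true, y_pred, average='macro'))     # Mean over classes of TP / (TP + FN)
print(f1_score(y_true, y_pred, average='macro'))         # Per-class harmonic mean of the two, averaged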
In [140]:
'''Visualize some of the model predictions.'''

def get_image(path):
    '''Load an image file and convert it to RGB.'''
    with open(os.path.abspath(path), 'rb') as f:
        with Image.open(f) as img:
            return img.convert('RGB')

classes = ["Covid", "Normal", "Pneumonia"]
pathname = os.path.join(dir, 'LIMEImages')
input_imgs = datasets.ImageFolder(pathname, val_transform)

val_loader = DataLoader(input_imgs, 
                        batch_size=batch_size, 
                        shuffle=False)

dataiter = iter(val_loader)
images, labels = next(dataiter)

model.eval()  # Inference mode: no auxiliary output, dropout disabled
outputs = model(images.to(device))
_, predicted = torch.max(outputs.data, 1)
probs = F.softmax(outputs, dim=1).cpu().detach().numpy()

img_pred_labels = []
for j in range(3):
    img_pred_labels.append(classes[predicted[j]])

img_paths = ['LIMEImages/covid/COVID-12.png', 
             'LIMEImages/normal/IM-0031-0001.jpeg', 
             'LIMEImages/pneumonia/person1_virus_12.jpeg']

plt.figure()
f, axarr = plt.subplots(1,3,figsize=(15,15))
f.subplots_adjust(wspace=0.5)

for n in range(3):
    axarr[n].imshow(get_image(os.path.join(dir, img_paths[n])))
    axarr[n].xaxis.set_tick_params(labelbottom=False)
    axarr[n].yaxis.set_tick_params(labelleft=False)
    axarr[n].set_xticks([])
    axarr[n].set_yticks([])
    axarr[n].set_title("Predicted label:{}\nTrue label:{}".format(classes[predicted[n]], classes[n]))
    
[Output: three X-rays with predicted and true labels]

Model Impact¶

Explainable AI helps characterize model accuracy, fairness, transparency, and outcomes, and is crucial in building trust and confidence when putting AI models into production. This becomes exceedingly important when a model is expected to predict outcomes in sensitive, life-changing situations.

Deployment¶

AI-enabled automation is often portrayed as a binary on-or-off process that is either automated or not. In the real world, however, automation is a spectrum, and the team deploying the model must choose where on the spectrum to operate. In the specific case of diagnosing patients with COVID-19 from X-rays, the following are the deployment options:

  1. Human only: No AI involved
  2. Shadow mode: A human doctor reads an X-ray and decides on a diagnosis, but an AI system shadows the doctor with its own attempt.
  3. AI assistance: A human doctor is responsible for the diagnosis, but the AI system may supply suggestions. For example, it can highlight areas of an X-ray for the doctor to focus on.
  4. Partial automation: An AI system looks at an X-ray image and, if it has high confidence in its decision, renders a diagnosis. In cases where it is not confident, it asks a human to make the final decision (see the sketch after this list).
  5. Full automation: The AI system makes the diagnosis on its own.
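A minimal sketch of the partial-automation rule from item 4 (the threshold is illustrative, and classes is the label list defined in the prediction cell above):

def triage(probs, threshold=0.95):
    '''Return the model's diagnosis when confident, otherwise defer to a doctor.'''
    conf, pred = probs.max(dim=1)  # Highest class probability and its index, per image
    return [classes[int(p)] if float(c) >= threshold else 'refer to human doctor'
            for c, p in zip(conf, pred)]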
Model Interpretation¶

Local Interpretable Model-Agnostic Explanations (LIME) can help us understand the reasons behind individual predictions, and can help place the trained model in shadow mode or AI assistance on the automation spectrum.
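Conceptually, LIME hides random subsets of superpixels, queries the model on each perturbed image, and fits a weighted linear surrogate whose coefficients score each superpixel's contribution to the prediction. A rough sketch of that loop (greatly simplified; the lime package handles segmentation, kernel weighting, and feature selection for us):

import numpy as np
from sklearn.linear_model import Ridge

def lime_sketch(img, segments, predict_fn, target_class, num_samples=1000):
    n_segs = segments.max() + 1
    masks = np.random.randint(0, 2, (num_samples, n_segs))  # Random on/off pattern per superpixel
    probs = []
    for mask in masks:
        perturbed = img.copy()
        for seg in range(n_segs):
            if mask[seg] == 0:
                perturbed[segments == seg] = 0               # Hide this superpixel
        probs.append(predict_fn(perturbed[None])[0, target_class])
    distances = 1 - masks.mean(axis=1)                       # Fraction of hidden superpixels
    weights = np.exp(-(distances ** 2) / 0.25)               # Favor samples close to the original
    surrogate = Ridge().fit(masks, probs, sample_weight=weights)
    return surrogate.coef_                                   # One importance score per superpixel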

In [142]:
img = get_image(os.path.join(dir, img_paths[0]))
plt.imshow(img)
Out[142]:
[Output image: the COVID-19 X-ray to be explained]
In [134]:
def get_pil_transform(): 
    transf = transforms.Compose([
        transforms.Resize((256, 256)),
        transforms.CenterCrop(224)  # 224 differs from the 299 used in training; torchvision's InceptionV3 still accepts it thanks to adaptive average pooling
    ])    

    return transf   

pill_transf = get_pil_transform()
In [131]:
def get_preprocess_transform():
    # ImageNet statistics; note this differs from the (0.5, 0.5) normalization used during training
    normalize = transforms.Normalize(mean=[0.485, 0.456, 0.406],
                                     std=[0.229, 0.224, 0.225])
    transf = transforms.Compose([
        transforms.ToTensor(),
        normalize
    ])    

    return transf 

preprocess_transform = get_preprocess_transform()

def batch_predict(images):
    model.eval()
    batch = torch.stack(tuple(preprocess_transform(i) for i in images), dim=0)

    device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
    model.to(device)
    batch = batch.to(device)
    
    logits = model(batch)             # The fc head already ends in Softmax, so these are probabilities rather than raw logits
    probs = F.softmax(logits, dim=1)  # A second softmax; it preserves the ranking of classes
    return probs.detach().cpu().numpy()
In [136]:
from lime import lime_image

explainer = lime_image.LimeImageExplainer()
explanation = explainer.explain_instance(np.array(pill_transf(img)), 
                                         batch_predict,     # Classification function returning class probabilities
                                         top_labels=3,      # Explain the 3 highest-probability classes
                                         hide_color=0,      # Hidden superpixels are filled with black
                                         num_samples=1000)  # Number of perturbed samples in the local neighbourhood
In [137]:
from skimage.segmentation import mark_boundaries

temp, mask = explanation.get_image_and_mask(explanation.top_labels[0], positive_only=True, num_features=3, hide_rest=False)
img_boundry1 = mark_boundaries(temp/255.0, mask)
plt.imshow(img_boundry1)
Out[137]:
[Output image: boundaries of the top superpixels for the predicted class]
In [148]:
temp, mask = explanation.get_image_and_mask(explanation.top_labels[0], positive_only=False, num_features=5, hide_rest=False)
img_boundry2 = mark_boundaries(temp/255.0, mask)
plt.imshow(img_boundry2)
Out[148]:
[Output image: superpixels supporting and contradicting the predicted class]
In [139]:
ind = explanation.top_labels[0]                  # Most probable class
dict_heatmap = dict(explanation.local_exp[ind])  # Superpixel index -> surrogate model weight
heatmap = np.vectorize(dict_heatmap.get)(explanation.segments)

plt.imshow(heatmap, cmap='RdBu', vmin=-heatmap.max(), vmax=heatmap.max())  # Symmetric diverging scale about zero
Out[139]:
[Output image: LIME explanation heatmap]

Future Work¶

  1. Fine-tune the model
  2. Experiment with adding multiple layers
  3. Remove text from X-ray images (to reduce bias)

Citations¶

  1. Badawi, A.; Elgazzar, K. Detecting Coronavirus from Chest X-rays Using Transfer Learning. COVID 2021, 1, 403-415. https://doi.org/10.3390/covid1010034
  2. Szegedy, Christian, et al. "Rethinking the inception architecture for computer vision." Proceedings of the IEEE conference on computer vision and pattern recognition. 2016. https://arxiv.org/abs/1512.00567