train.py

import os 
import sys
import random
import math
import numpy as np
import cv2

from imgaug import augmenters as iaa
import imgaug as ia
import glob
import pickle

import warnings 
warnings.filterwarnings("ignore")


#segmentation_train_dir="/root/ye/Data/Indian-Diabetic/Segmentation/Groundtruths/training/"
#original_train_dir="/root/ye/Data/Indian-Diabetic/Segmentation/Original-Images/training/"

#segmentation_val_dir="/root/ye/Data/Indian-Diabetic/Segmentation/Groundtruths/testing/"
#original_val_dir="/root/ye/Data/Indian-Diabetic/Segmentation/Original-Images/testing//"
#images_list=glob.glob(DATA_DIR+"*.tif")

WORK_DIR="./checkpoint"
WEIGHTS_PATH="../mask_rcnn_imagenet.h5"

height,width=2848,4288
LEARNING_RATE = 0.006


sys.path.append("..")
from mrcnn.config import Config
from mrcnn import utils
import mrcnn.model as modellib
from mrcnn import visualize
from mrcnn.model import log
from keras.callbacks import  LearningRateScheduler
import keras.backend as K


with open("./data/train-mask.pkl","rb") as msk:
    train_mask=pickle.load(msk)
    
    
with open("./data/val-mask.pkl","rb") as msk:
    val_mask=pickle.load(msk)


class DetectorConfig(Config):
    """Configuration for training pneumonia detection on the RSNA pneumonia dataset.
    Overrides values in the base Config class.
    """
    
    NAME="IDRiD"
    
    GPU_COUNT=1
    IMAGES_PER_GPU=1
    
    BACKBONE="resnet50"
    
    NUM_CLASSES=1+5 # background +1 pneumonia classes
    IMAGE_MIN_DIM=800
    IMAGE_MAX_DIM=1024
    RPN_ANCHOR_SCALES = (8, 16, 32, 64, 128)
    TRAIN_ROIS_PER_IMAGE =32
    LEARNING_RATE=0.00001
    WEIGHT_DECAY=0.002
    VALIDATION_STEPS=200
    STEPS_PER_EPOCH =15000

config=DetectorConfig()
config.display()

augmentation = iaa.SomeOf((0, 3), [
    iaa.Fliplr(0.5),
    iaa.Flipud(0.5),
    iaa.OneOf([iaa.Affine(rotate=90),
               iaa.Affine(rotate=180),
               iaa.Affine(rotate=270)],
             ),
    iaa.Affine(scale={"x": (0.8, 1.2), "y": (0.8, 1.2)}),
    iaa.Multiply((0.8, 1.5)),
    iaa.GaussianBlur(sigma=(0.0, 5.0))
])


sometimes = lambda aug: iaa.Sometimes(0.5, aug)
seq = iaa.Sequential(
    [
        # apply the following augmenters to most images
        iaa.Fliplr(0.5), # horizontally flip 50% of all images
        iaa.Flipud(0.2), # vertically flip 20% of all images
        # crop images by -5% to 10% of their height/width
        sometimes(iaa.CropAndPad(
            percent=(-0.05, 0.1),
            pad_mode=ia.ALL,
            pad_cval=(0, 255)
        )),
        sometimes(iaa.Affine(
            scale={"x": (0.8, 1.2), "y": (0.8, 1.2)}, # scale images to 80-120% of their size, individually per axis
            translate_percent={"x": (-0.2, 0.2), "y": (-0.2, 0.2)}, # translate by -20 to +20 percent (per axis)
            rotate=(-45, 45), # rotate by -45 to +45 degrees
            shear=(-16, 16), # shear by -16 to +16 degrees
            order=[0, 1], # use nearest neighbour or bilinear interpolation (fast)
            cval=(0, 255), # if mode is constant, use a cval between 0 and 255
            mode=ia.ALL # use any of scikit-image's warping modes (see 2nd image from the top for examples)
        )),
        # execute 0 to 5 of the following (less important) augmenters per image
        # don't execute all of them, as that would often be way too strong
        iaa.SomeOf((0, 5),
            [
                sometimes(iaa.Superpixels(p_replace=(0, 1.0), n_segments=(20, 200))), # convert images into their superpixel representation
                iaa.OneOf([
                    iaa.GaussianBlur((0, 3.0)), # blur images with a sigma between 0 and 3.0
                    iaa.AverageBlur(k=(2, 7)), # blur image using local means with kernel sizes between 2 and 7
                    iaa.MedianBlur(k=(3, 11)), # blur image using local medians with kernel sizes between 2 and 7
                ]),
                iaa.Sharpen(alpha=(0, 1.0), lightness=(0.75, 1.5)), # sharpen images
                iaa.Emboss(alpha=(0, 1.0), strength=(0, 2.0)), # emboss images
                # search either for all edges or for directed edges,
                # blend the result with the original image using a blobby mask
                iaa.SimplexNoiseAlpha(iaa.OneOf([
                    iaa.EdgeDetect(alpha=(0.5, 1.0)),
                    iaa.DirectedEdgeDetect(alpha=(0.5, 1.0), direction=(0.0, 1.0)),
                ])),
                iaa.AdditiveGaussianNoise(loc=0, scale=(0.0, 0.05*255), per_channel=0.5), # add gaussian noise to images
                iaa.OneOf([
                    iaa.Dropout((0.01, 0.1), per_channel=0.5), # randomly remove up to 10% of the pixels
                    iaa.CoarseDropout((0.03, 0.15), size_percent=(0.02, 0.05), per_channel=0.2),
                ]),
                iaa.Invert(0.05, per_channel=True), # invert color channels
                iaa.Add((-10, 10), per_channel=0.5), # change brightness of images (by -10 to 10 of original value)
                iaa.AddToHueAndSaturation((-20, 20)), # change hue and saturation
                # either change the brightness of the whole image (sometimes
                # per channel) or change the brightness of subareas
                iaa.OneOf([
                    iaa.Multiply((0.5, 1.5), per_channel=0.5),
                    iaa.FrequencyNoiseAlpha(
                        exponent=(-4, 0),
                        first=iaa.Multiply((0.5, 1.5), per_channel=True),
                        second=iaa.ContrastNormalization((0.5, 2.0))
                    )
                ]),
                iaa.ContrastNormalization((0.5, 2.0), per_channel=0.5), # improve or worsen the contrast
                iaa.Grayscale(alpha=(0.0, 1.0)),
                sometimes(iaa.ElasticTransformation(alpha=(0.5, 3.5), sigma=0.25)), # move pixels locally around (with random strengths)
                sometimes(iaa.PiecewiseAffine(scale=(0.01, 0.05))), # sometimes move parts of the image around
                sometimes(iaa.PerspectiveTransform(scale=(0.01, 0.1)))
            ],
            random_order=True
        )
    ],
    random_order=True
)


def step_decay(epoch):
    initial_lrate = config.LEARNING_RATE
    drop = 0.1
    epochs_drop = 10.0
    lrate = initial_lrate * math.pow(drop,  
           math.floor((1+epoch)/epochs_drop))
    return lrate

lrate = LearningRateScheduler(step_decay)


class DetectorDataset(utils.Dataset):
    """Dataset class for training pneumonia detection on the RSNA pneumonia dataset.
    """

    def __init__(self,image_annotations, orig_height, orig_width):
        super().__init__(self)
        
        #self.add_class("IDRiD",0,"BG")
        self.add_class("IDRiD",1,"Haemorrhages")
        self.add_class("IDRiD",2,"SoftExudates")
        self.add_class("IDRiD",3,"HardExudates")
        self.add_class('IDRiD',4,"Microaneurysms")
        self.add_class("IDRiD",5,"OpticDisc")
        self.label_dict={"BG":0,"Haemorrhages":1,"SoftExudates":2,"HardExudates":3,"Microaneurysms":4,"OpticDisc":5}
        # add images 
        for i, fp in enumerate(image_annotations):
            classes = fp["classes"]
            path=fp["path"]
            mask=fp["mask"]
            self.add_image('IDRiD', image_id=i, path=path, mask=mask,
                           classes=classes, orig_height=orig_height, orig_width=orig_width)
            
    def image_reference(self, image_id):
        assert image_id in self.image_ids
        info = self.image_info[image_id]
        return info['path']

    def load_image(self, image_id):
        info = self.image_info[image_id]
        fp = info['path']
        image=cv2.imread(fp)
        # If grayscale. Convert to RGB for consistency.
        if len(image.shape) != 3 or image.shape[2] != 3:
            image = np.stack((image,) * 3, -1)
        return image

    def load_mask(self, image_id):
        info = self.image_info[image_id]
        count=info["mask"].shape[-1]
        classes=info["classes"]
        
        class_ids = np.zeros((count), dtype=np.int32)
        #class_ids = np.array([self.class_names.index(s[0]) for s in classes])
        msk=info["mask"]
        for i,c in enumerate(classes):
            class_ids[i]=self.label_dict[c]
        return msk.astype(np.bool), class_ids.astype(np.int32)
 

dataset_train=DetectorDataset(image_annotations=train_mask,orig_height=height,orig_width=width)
dataset_train.prepare()

dataset_val=DetectorDataset(image_annotations=val_mask,orig_height=height,orig_width=width)
dataset_val.prepare()


model=modellib.MaskRCNN(mode='training',config=config,model_dir=WORK_DIR)
# Exclude the last layers because they require a matching
# number of classes
model.load_weights(WEIGHTS_PATH, by_name=True, exclude=[
    "mrcnn_class_logits", "mrcnn_bbox_fc",
    "mrcnn_bbox", "mrcnn_mask"])


## train heads with higher lr to speedup the learning
model.train(dataset_train, dataset_val,augmentation=seq,
            learning_rate=config.LEARNING_RATE,
            epochs=20,
            layers="5+")

history = model.keras_model.history.history