imageLoader.py

# -*- coding: utf-8 -*-
'''
Copyright 2017 Mads Dyrmann

Permission is hereby granted, free of charge, to any person obtaining a copy of
this software and associated documentation files (the "Software"), to deal in
the Software without restriction, including without limitation the rights to
use, copy, modify, merge, publish, distribute, sublicense, and/or sell copies
of the Software, and to permit persons to whom the Software is furnished to do
so, subject to the following conditions:

The above copyright notice and this permission notice shall be included in all
copies or substantial portions of the Software.

THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
SOFTWARE.
'''

'''
Verision History:

Ver 1.1.5: 2017-09-11: Specified datatype for onehot labels and images as int32 and float32, respectively.
Ver 1.1.6: 2017-10-05: Code structuring. Initial support for label-images for use with semantic segmentation

#TODO: Support for image and label pairs like e.g. VOC or semantic segmentation
#TODO: Support for defining train, test and val splits
'''

import numpy as np
from skimage import io, transform
import os


class imageLoader:
    def __init__(self):
        self.inputs = []
        self.targets = []
        self.nSamples = 0
        self.imagesize = (256, 256, 3)
        self.targetsNumerical = []
        self.targetsNumericalStrings=[]
        self.targetsOneHot = []
        self.labelsDict = {}
        self.numericalDictionary = None
        self.nClasses = []
        self.inputpath = ''
        self.__version__ = '1.1.7'


    """
    #Generator, which loops over a list of paths to files
    def iterate_minibatchesList(self, batchsize, shuffle=False, returnstyle='numerical'):
        assert len(self.inputs) == len(self.targets)

        import warnings
        warnings.warn('Not tested yet! Please report any unintende behaviour')

        if shuffle:
            indices = np.arange(len(self.inputs))
            np.random.shuffle(indices)
        for start_idx in range(0, len(self.inputs) - batchsize + 1, batchsize):
            if shuffle:
                excerpt = indices[start_idx:start_idx + batchsize]
            else:
                excerpt = slice(start_idx, start_idx + batchsize)
            x=[self.inputs[ix] for ix  in excerpt]
            yield x, self.getLabelbatch(excerpt=excerpt, returnstyle=returnstyle)


    #Generator, which loops over a images of paths to files
    def iterate_minibatchesImage(self, batchsize, shuffle=False, returnstyle='numerical', zeromean=False, normalize=False):
        assert len(self.inputs) == len(self.targets)
        if shuffle:
            indices = np.arange(len(self.inputs))
            np.random.shuffle(indices)
        for start_idx in range(0, len(self.inputs) - batchsize + 1, batchsize):
            if shuffle:
                excerpt = indices[start_idx:start_idx + batchsize]
                inputs = [self.inputs[x] for x in excerpt]
            else:
                excerpt = slice(start_idx, start_idx + batchsize)
                inputs = self.inputs[excerpt]

            x = np.empty((batchsize,)+self.imagesize,dtype=np.float32)
            for ix, filename in enumerate(inputs):
                im = io.imread(filename)
                x[ix, :] = transform.resize(im, self.imagesize).astype(np.float32)
            if zeromean:
                x=x-127
            if normalize:
                x=x/255.0
            yield x, self.getLabelbatch(excerpt=excerpt, returnstyle=returnstyle)

    """


    #Generator, which loops over a images of paths to files
    def iterate_minibatches(self, batchsize, shuffle=False, labelstyle='numerical', datastyle='image', zeromean=False, normalize=False, resize=False, preprocessor=None, startOverAfterFinished=False):
        assert len(self.inputs) == len(self.targets)
        if shuffle:
            indices = np.arange(len(self.inputs))
            np.random.shuffle(indices)

        while True:
            for start_idx in range(0, len(self.inputs) - batchsize + 1, batchsize):
                if shuffle:
                    excerpt = indices[start_idx:start_idx + batchsize]
                    inputs = [self.inputs[x] for x in excerpt]
                else:
                    excerpt = slice(start_idx, start_idx + batchsize)
                    inputs = self.inputs[excerpt]

                #Decode image if datastyle is image
                if datastyle=='image':
                    x = np.empty((batchsize,)+self.imagesize,dtype=np.float32)
                    for ix, filename in enumerate(inputs):
                        im = io.imread(filename)

                        if preprocessor:
                            im = preprocessor(1.0*im)
                        if resize:
                            im = transform.resize(im, self.imagesize).astype(np.float32)
                        if zeromean:
                            im=1.0*im-127
                        if normalize:
                            im=im/255.0
                        #Batch it up
                        x[ix, :] = im

                #Return path to sample if datastyle is path
                if datastyle=='path':
                    x=[self.inputs[ix] for ix in excerpt]

                yield x, self.getLabelbatch(excerpt=excerpt, returnstyle=labelstyle)

            if not startOverAfterFinished:
                break


    # Create a batch of labels based on the specified returntype
    def getLabelbatch(self, excerpt, returnstyle):
            if returnstyle == 'numerical':
                return np.array(self.targetsNumerical)[excerpt]
            if returnstyle == 'onehot':
                return np.array(self.targetsOneHot)[excerpt]
            if returnstyle == 'label':
                return (np.array(self.targets)[excerpt]).tolist()
            if returnstyle == 'path':
                return (np.array(self.targets)[excerpt]).tolist()
                #TODO: just return the path to the annotation file, e.g. image or label
            #In semantic segmentation, the target is an image
            if returnstyle == 'image':
                inputs = self.targets[excerpt]
                y = np.empty((len(excerpt),)+self.imagesize,dtype=np.float32)
                for ix, filename in enumerate(inputs):
                    im = io.imread(filename)
                    y[ix, :] = transform.resize(im, self.imagesize)
                return y


    def getImagesAndLabels(self, indices=None, returnstyle='numerical', shuffle=False, zeromean=False, normalize=False, resize=True, preprocessor=None):
        if indices==None: #If not defined, load all
            indices=list(range(self.nSamples))
        if shuffle:
            np.random.shuffle(indices)

        inputs = [self.inputs[x] for x in indices]

        #x = np.empty((len(indices),)+self.imagesize,dtype=np.float32)

        x = []

        for ix, filename in enumerate(inputs):
            print('loading im '+str(ix)+' of '+str(len(indices)))
            im = io.imread(filename)

            if preprocessor:
                im = preprocessor(1.0*im)
            if resize:
                im = transform.resize(im, self.imagesize).astype(np.float32)
            if zeromean:
                im=1.0*im-127
            if normalize:
                im=im/255.0
            #Batch it up
            x.append(im)


        if returnstyle == 'numerical':
            return x, np.array(self.targetsNumerical)[indices]
        if returnstyle == 'onehot':
            return x, np.array(self.targetsOneHot)[indices]
        if returnstyle == 'label':
            return x, (np.array(self.targets)[indices]).tolist()

    #Update one-hot targets
    def updateOneHotTargets(self, numClasses=None):
        #Use numClasses for overwriting the number of targets in current dataset.
        #Useful if, e.g. the test-set only contains 3 classes and the training contains 5 classes
        if not numClasses:
            numClasses = self.nClasses
        self.targetsOneHot = np.eye(numClasses)[self.targetsNumerical].astype(np.int32)

    #Update targets numerical
    def updateTargetsNumericalStrings(self):
        self.targetsNumericalStrings = [str(x) for x in self.targetsNumerical]


    # Update image-list from csv-file
    def inputsFromCSV(self, csvpath, delimiter=';', numericalTargets=False):
        self.inputpath = csvpath

        import csv
        with open(csvpath, 'rb') as csvfile:
            csvreader = csv.reader(csvfile, delimiter=delimiter, quotechar='"')
            next(csvreader, None)  # Skip header
            for row in csvreader:
                self.inputs.append(row[0])
                self.targets.append(row[2])
                self.targetsNumerical.append(int(row[1]))

        self.updateDicts()
        self.updateDataStats()


    def exportCSV(self, exportpath, delimiter=';'):
        import pandas as pd
        pathAndLables=list(zip(self.inputs,self.targetsNumerical))
        pd.DataFrame(pathAndLables).to_csv(exportpath,sep=delimiter,header=False, index=False)


    def exportTFrecords(self, exportname='train.tfrecords'):
        import tensorflow as tf

        def _int64_feature(value):
            return tf.train.Feature(int64_list=tf.train.Int64List(value=[value]))
        def _bytes_feature(value):
            return tf.train.Feature(bytes_list=tf.train.BytesList(value=[value]))


        # open the TFRecords file
        writer = tf.python_io.TFRecordWriter(exportname)
        for img, label in self.iterate_minibatchesImage(batchsize=1, shuffle=False, returnstyle='numerical', zeromean=False, normalize=False):

            # Create a feature
            feature = {'train/label': _int64_feature(label),
                       'train/image': _bytes_feature(tf.compat.as_bytes(img.tostring()))}
            # Create an example protocol buffer
            example = tf.train.Example(features=tf.train.Features(feature=feature))

            # Serialize to string and write on the file
            writer.write(example.SerializeToString())

        writer.close()


    def updateDicts(self):
        self.numericalDictionary = {key:ix for ix,key in enumerate(list(set(self.targets)))}
        self.labelsDict = {ix:key for ix,key in enumerate(list(set(self.targets)))}


    #Create list of images from input path, where folder-names are used as labels
    def inputsFromFilePath(self, filepath, targetpath=None, labelspath=None):
        self.inputpath = filepath
        # Find all images in folder and subfolder
        for root, dirnames, filenames in os.walk(filepath):
            for filename in filenames:
                if filename.lower().endswith(('.jpg', '.jpg', '.png', '.tif', '.tiff')):
                    self.inputs.append(os.path.join(root, filename))


        #Use foldername as targets if targets is not specified
        if targetpath is None:
            self.targets = [x.split('/')[-2] for x in self.inputs]

        #If a path for targets is specied, match targets by filename with the inputs
        else:
            #Get all files in the targets directory
            targetstmp=[]
            for root, dirnames, filenames in os.walk(targetpath):
                for filename in filenames:
                    targetstmp.append(os.path.join(root, filename))

            #for all images, find their targets
            for inp in self.inputs:
                #targ = [x for x in targetstmp if os.path.splitext(os.path.basename(x))[0]==os.path.splitext(os.path.basename(inp))[0]]
                targ = [x for x in targetstmp if fileparts(x)[1]==fileparts(inp)[1]]

                assert(len(targ)>0)
                self.targets.append(targ[0])


        #Load labelspath if path is given as input
        if labelspath:
            self.loadDict(labelspath)


        # Create  numerical labels if they do not exist
        if not self.numericalDictionary:
            self.updateDicts()

        self.targetsNumerical = [self.numericalDictionary[x] for x in self.targets]
        self.updateDataStats()

    def updateDataStats(self):
        self.nSamples = len(self.inputs)
        self.nClasses = len(self.numericalDictionary)
        self.updateOneHotTargets()
        self.updateTargetsNumericalStrings()

    def exportDict(self,labelpath='labels.txt'):
        with open(labelpath,'w') as f:
            f.write('\n'.join([str(k)+':'+self.labelsDict[k] for k in self.labelsDict.keys()]))

    def loadDict(self,dictpath):
        with open(dictpath,'r') as f:
            dt = f.readlines()
            dt = [d.split(':') for d in dt]
            dt = [[int(d[0]),d[1]] for d in dt]
            self.labelsDict = dict(dt)


def fileparts(filepath):
    return os.path.dirname(filepath), os.path.splitext(os.path.basename(filepath))[0], os.path.splitext(filepath)[-1]


## Usage:
##   trainpath = './Train'
##   testpath = './Test'
##   il_train2, il_test2 = imageLoader.setupTrainValAndTest(trainpath=trainpath,testpath=testpath,valpath=None,imagesize=(28,28,3))
##


def setupTrainValAndTestFromOneInput(datapath=None,testFraction=0.2,ValFraction=0.2,TrainFraction=0.6):
    assert datapath is not None
    #TODO: Not yet implemented


def setupTrainValAndTest(trainpath=None,testpath=None,valpath=None,trainlabelpath=None,testlabelpath=None,vallabelpath=None,imagesize=(None,None,None)):
    assert trainpath is not None
    # Setup classes, and make correct label setup between the three classes
    returnClasses=[]
    if trainpath:
        il_train = imageLoader()
        il_train.imagesize = (imagesize[0],imagesize[1],imagesize[2])
        if os.path.isfile(trainpath):
            il_train.inputsFromCSV(trainpath)
        else:
            il_train.inputsFromFilePath(trainpath)
        il_train.updateDataStats()
        returnClasses.append(il_train)
    if testpath:
        il_test = imageLoader()
        il_test.numericalDictionary = il_train.numericalDictionary #Use same dictionary as for training
        il_test.imagesize = (imagesize[0],imagesize[1],imagesize[2])
        if os.path.isfile(testpath):
            il_test.inputsFromCSV(testpath)
        else:
            il_test.inputsFromFilePath(testpath)
        il_test.updateOneHotTargets(numClasses=il_train.nClasses)
        returnClasses.append(il_test)
    if valpath:
        il_val = imageLoader()
        il_val.numericalDictionary = il_train.numericalDictionary #Use same dictionary as for training
        il_val.imagesize = (imagesize[0],imagesize[1],imagesize[2])
        if os.path.isfile(testpath):
            il_val.inputsFromCSV(valpath)
        else:
            il_val.inputsFromFilePath(valpath)
        il_val.updateOneHotTargets(numClasses=il_train.nClasses)
        returnClasses.append(il_val)
    # Return an instance for train, val and test if paths are provided
    return returnClasses