# Classifier.py

"""
James Quintero
Created: 2019
"""


#Local files
from DICOM_reader import DICOMReader
from DataHandler import DataHandler
from ImagePreprocessor import *
from DataGenerator import DataGenerator


import sys
import os
import random
import json
import scipy
import imageio
from datetime import datetime

#ML libraries
import numpy as np

#Sklearn
from sklearn.metrics import confusion_matrix
from sklearn.metrics import accuracy_score
from sklearn.model_selection import KFold
from sklearn.utils import resample

#Scipy
from scipy.optimize import differential_evolution

import keras
from keras import backend as K

#Layers
from keras.layers import Input
from keras.layers import *

#Models
from keras.models import Sequential
from keras.models import Model
from keras.models import load_model

#Callback methods
from keras.callbacks import EarlyStopping
from keras.callbacks import ModelCheckpoint

#Regularizers
from keras.regularizers import l2
from keras.regularizers import l1

#constraints
from keras.constraints import max_norm

from keras.utils import np_utils
from keras.preprocessing.image import ImageDataGenerator
from keras.optimizers import Adam


#For my windows machine
os.environ['CUDA_VISIBLE_DEVICES'] = '-1'


"""

Handles different types (binary, segmentation) of classification training, validation, and testing

"""
class Classifier(ABC):
    project = ""

    image_width = 512
    image_height = 512

    model_archs = {"cnn": "cnn", "unet": "unet"}

    dicom_reader = None
    data_handler = None
    image_preprocessor = None

    hyperparameters = {}

    def __init__(self, project):
        """
        Creates the reader/handler helpers and loads the hyperparameters.

        project: project name, compared case-insensitively. "chest_radiograph"
                 selects the ChestRadiograph preprocessor; for any other value
                 image_preprocessor is not assigned here.
        """
        self.dicom_reader = DICOMReader()
        self.data_handler = DataHandler()

        #project names are stored lower-cased
        project_name = project.lower()
        self.project = project_name
        if project_name == "chest_radiograph":
            self.image_preprocessor = ChestRadiograph()

        #hyperparameters are provided by the data handler
        loaded_hyperparameters = self.data_handler.load_hyperparameters()
        self.hyperparameters = loaded_hyperparameters


    #returns proper filename prefix for specified model_arch, e.x: "cnn" returns "cnn" for use in "./cnn_model.h5"
    def get_model_arch_filename_prefix(self, model_arch):
        try:
            return self.model_archs[model_arch.lower()]
        except Exception as error:
            return ""

    """
    returns list of paths to processed image files
    dataset_type = {"train", "test"}
    label_type = {"binary", "segmentation"}
    """
    def get_processed_image_paths(self, dataset_type="train", label_type="binary", balanced=False, max_num=None):

        if dataset_type.lower() == "train":
            image_paths = self.dicom_reader.load_filtered_dicom_train_paths()
        elif dataset_type.lower() == "test":
            image_paths = self.dicom_reader.load_filtered_dicom_test_paths()


        #if user wants paths where it's 50% positive, and 50% negative
        if balanced:
            print("Loading balanced amount of positive and negative targets")
            new_image_paths = []
            negative = []
            positive = []

            for i in range(0, len(image_paths)):
                image_path = image_paths[i]

                #extracts image_id from the file path
                image_id = self.dicom_reader.extract_image_id(image_paths[i], self.image_preprocessor.preprocessed_ext)

                #finds positive mask associated with the image
                masks = self.data_handler.find_masks(image_id=image_id)

                #if Negative
                if len(masks)==0:
                    #makes sure haven't added too many negative labels
                    if (max_num==None and len(negative)<int(len(image_paths)/2)) or (max_num!=None and len(negative)<int(max_num/2)):
                        negative.append(image_path)
                #if Positive
                else:
                    #makes sure haven't added too many positive labels
                    if (max_num==None and len(positive)<int(len(image_paths)/2)) or (max_num!=None and len(positive)<int(max_num/2)):
                        positive.append(image_path)

                #if found enough of both positive and negative
                if max_num!=None and len(positive)+len(negative)>=max_num:
                    break


            #resize negative and positive arrays to match each other
            if len(positive)>len(negative):
                positive = positive[:len(negative)]
            elif len(positive)<len(negative):
                negative = negative[:len(positive)]

            #shuffles positives and negatives
            image_paths = []
            image_paths.extend(positive)
            image_paths.extend(negative)
            random.seed(12345)
            random.shuffle(image_paths)


        #if user doesn't want an explicit balance of positive and negative signals
        else:
            #if no max, set max to the number of train items
            if max_num!=None and max_num<=len(image_paths) and max_num>0:
                image_paths = image_paths[:max_num]


        return image_paths


    """
    returns statistical measures related to confusion matrix
    confusion_matrix is in the following format
    [TN  FP]
    [FN  TP]
    """
    def calculate_statistical_measures(self, confusion_matrix):
        statistical_measures = {}


        try:
            #True Negative
            TN = confusion_matrix[0][0]
            statistical_measures['TN'] = TN
            #False Positive
            FP = confusion_matrix[0][1]
            statistical_measures['FP'] = FP
            #False Negative
            FN = confusion_matrix[1][0]
            statistical_measures['FN'] = FN
            #True Positive
            TP = confusion_matrix[1][1]
            statistical_measures['TP'] = TP
        except Exception as error:
            print("Mishapen confusion matrix") 
            return {}


        #https://en.wikipedia.org/wiki/Confusion_matrix

        if (TN+FP+FN+TP)>0:
            accuracy = (TN+TP)/(TN+FP+FN+TP)
        else:
            accuracy = 0
        statistical_measures['accuracy'] = accuracy

        if TP>0:
            precision = TP/(FP+TP)
        else:
            precision = 0
        statistical_measures['precision'] = precision

        if TN>0:
            negative_predictive_value = TN/(TN+FN)
        else:
            negative_predictive_value = 0
        statistical_measures['NPV'] = negative_predictive_value


        if TP>0:
            F1 = (2*TP) / (2*TP + FP + FN) 
        else:
            F1 = 0
        statistical_measures['F1'] = F1


        if TP > 0:
            sensitivity = TP/(TP+FN)
        else:
            sensitivity = 0
        statistical_measures['sensitivity'] = sensitivity


        #Matthews correlation coefficient (great for binary classification)
        #https://en.wikipedia.org/wiki/Matthews_correlation_coefficient
        try:
            MCC = (TP*TN - FP*FN)/np.sqrt((TP+FP)*(TP+FN)*(TN+FP)*(TN+FN))
        except Exception as error:
            MCC = 0
        statistical_measures['MCC'] = MCC


        #when it's a downmove, how often does model predict a downmove?
        if TN>0:
            specificity = TN/(TN+FP)
        else:
            specificity = 0
        statistical_measures['specificity'] = specificity


        #False Positive Rate (FPR) (Fall-Out)
        FPR = 1 - specificity
        statistical_measures['FPR'] = FPR

        #False Negative Rate (FNR)
        FNR = 1 - sensitivity
        statistical_measures['FNR'] = FNR

        #both TPR (sensitivity) and FPR (100-Specificity) are used to plot the ROC (Receiver Operating Characteristic) curve
        #https://www.medcalc.org/manual/roc-curves.php
        ROC = sensitivity - FPR
        statistical_measures['ROC'] = ROC


        #want to get 200%, 100% for sensitivity and 100% for specificity
        #https://en.wikipedia.org/wiki/Youden%27s_J_statistic
        total = sensitivity + specificity
        statistical_measures['total'] = total


        return statistical_measures


    def dice_coef(self, y_true, y_pred):
        """
        Dice coefficient of y_true and y_pred computed with Keras backend ops.

        Both inputs are flattened; a smoothing term of 1 is added to the
        numerator and the denominator.
        """
        smoothing = 1.
        flat_truth = K.flatten(y_true)
        flat_prediction = K.flatten(y_pred)
        overlap = K.sum(flat_truth * flat_prediction)

        numerator = 2. * overlap + smoothing
        denominator = K.sum(flat_truth) + K.sum(flat_prediction) + smoothing
        return numerator / denominator


    def dice_coef_loss(self, y_true, y_pred):
        return 1-self.dice_coef(y_true, y_pred)

    """
    Returns simple default CNN architecture
    """
    @abstractmethod
    def create_CNN(self):
        """
        Builds, compiles and returns the default sequential CNN.

        Four stages of convolution -> max pooling -> dropout are followed by a
        128 unit dense layer and a single linear output unit. The model is
        compiled with the adam optimizer and mean squared error loss, and its
        summary is printed before it is returned.
        """
        filter_count = 16
        kernel_shape = (3,3)
        pooling_shape = (3,3)
        conv_activation = "selu"
        hidden_activation = "selu"

        network = Sequential()

        #the first convolution also declares the input: a single channel image
        network.add(Convolution2D(filter_count, kernel_shape, input_shape = (self.image_width, self.image_height, 1), padding="same", activation = conv_activation))
        #max pooling keeps the largest value of every pooling window
        network.add(MaxPooling2D(pool_size = pooling_shape))
        network.add(Dropout(0.25))

        #three further identical convolution stages
        for _ in range(3):
            network.add(Convolution2D(filter_count, kernel_shape, padding="same", activation = conv_activation))
            network.add(MaxPooling2D(pool_size = pooling_shape))
            network.add(Dropout(0.25))

        #flattens the feature maps for the dense layers
        network.add(Flatten())

        #128 is an arbitrary number that can be decreased to lower computation time, and increased for better accuracy
        network.add(Dense(units = 128, activation = hidden_activation))
        network.add(Dropout(0.25))

        network.add(Dense(units = 1, activation = "linear"))

        #alternative: compile with loss=self.dice_coef_loss and metrics=[self.dice_coef]
        network.compile(optimizer = 'adam', loss = "mean_squared_error", metrics = ['accuracy'])

        network.summary()

        return network


    """
    returns very simple U-net
    architecture source: https://github.com/yihui-he/u-net
     and https://github.com/jocicmarko/ultrasound-nerve-segmentation/
    """
    @abstractmethod
    def create_Unet(self):
        """
        Builds, compiles and returns a small U-net style model with a single sigmoid output.

        Three double-convolution stages go down (16, 32, 64 filters), two go back up
        with skip connections to the matching downward stage, and the final 1x1
        convolution is flattened into one dense sigmoid unit. The model is compiled with
        Adam (lr=1e-5) and mean squared error, and its summary is printed.
        """
        base_filters = 16
        pooling = (2,2)
        kernel = (3,3)
        hidden_activation = "selu"

        def double_conv(tensor, filters):
            #two same-padded convolutions followed by batch normalization
            tensor = Conv2D(filters, kernel, activation=hidden_activation, padding='same')(tensor)
            tensor = Conv2D(filters, kernel, activation=hidden_activation, padding='same')(tensor)
            return BatchNormalization()(tensor)

        def upsample_and_merge(tensor, skip, filters):
            #upsamples, convolves, then concatenates with the skip connection on the channel axis
            reducer = Conv2D(filters, pooling, activation=hidden_activation, padding='same')
            enlarged = UpSampling2D(size=pooling)(tensor)
            return concatenate([reducer(enlarged), skip], axis=3)

        inputs = Input((self.image_width, self.image_height, 1))

        #downward path
        down1 = double_conv(inputs, base_filters*1)
        pooled1 = MaxPooling2D(pool_size=pooling)(down1)

        down2 = double_conv(pooled1, base_filters*2)
        pooled2 = MaxPooling2D(pool_size=pooling)(down2)

        bottom = double_conv(pooled2, base_filters*4)

        #upward path
        merged2 = upsample_and_merge(bottom, down2, base_filters*2)
        up2 = double_conv(merged2, base_filters*2)

        merged1 = upsample_and_merge(up2, down1, base_filters*1)
        up1 = double_conv(merged1, base_filters*1)

        single_channel = Convolution2D(1, (1, 1), activation=hidden_activation)(up1)

        #collapses the single channel map into one sigmoid output
        flattened = Flatten()(single_channel)
        output = Dense(units = 1, activation = "sigmoid")(flattened)

        model = Model(inputs=inputs, outputs=output)

        model.compile(optimizer=Adam(lr=1e-5), loss="mean_squared_error", metrics=["accuracy"])

        model.summary()

        return model

    """
    returns parameters for the data generator depending on which step of the model creation process we are in
    """
    def get_data_generator_params(self, step="train"):
        # Parameters
        params = {'dim': (self.image_height,self.image_width,1),
                  'augment': True,
                  'shuffle': True}

        if step.lower() == "train":
            params['augment'] = True
            params['shuffle'] = True

        elif step.lower() == "test":
            params['augment'] = False
            params['shuffle'] = False

        return params

    """
    returns Data Generator
    """
    @abstractmethod
    def create_data_generator(self, feature_dataset, label_dataset, batch_size, step="train"):
        """
        Returns a "binary" DataGenerator over the given features and labels,
        configured with the parameters for the requested step.
        """
        generator_options = self.get_data_generator_params(step=step)
        return DataGenerator(feature_dataset, label_dataset, batch_size, "binary", **generator_options)


    """
    returns list of individual confusion matrices if segmentation, and list of size 1 for binary
    """
    @abstractmethod
    def calculate_confusion_matrices(self, target_data, prediction_data):
        """
        Returns a list of confusion matrices for the given targets and predictions.

        This default implementation builds one confusion matrix over all samples and
        returns it as a list of size 1, which is the list form statistical_analysis
        iterates over.
        """
        #calculates confusion matrix (the arguments were previously undefined names)
        conf_matrix = confusion_matrix(target_data, prediction_data)

        return [conf_matrix]


    def print_statistical_measures(self, stats):
        print("----------------------------------")
        confusion_matrix = [[stats['TN'], stats['FP']], [stats['FN'], stats['TP']]]
        self.print_confusion_matrix(confusion_matrix)
        print("----------------------------------")
        print("Accuracy:                "+str(stats['accuracy']))
        print("----------------------------------")
        print("False Positive Rate:     "+str(stats['FPR']))
        print("False Negative Rate:     "+str(stats['FNR']))
        print("PPV (Precision):         "+str(stats['precision']))
        print("----------------------------------")
        print("Specificity:             "+str(stats['specificity']))
        print("Sensitivity:             "+str(stats['sensitivity']))
        print("Total (spec + sens):     "+str(stats['total']))
        print("----------------------------------")
        print("ROC:                     "+str(stats['ROC']))
        print("F1:                      "+str(stats['F1']))
        print("MCC:                     "+str(stats['MCC']))
        print("----------------------------------")
        # print()


    """
    prints confusion matrix in format
    [    TN,   FP]
    [    FN,   TP]
    """
    def print_confusion_matrix(self, confusion_matrix):
        print("[{0:5d}, {1:5d}]".format(int(confusion_matrix[0][0]), int(confusion_matrix[0][1])))
        print("[{0:5d}, {1:5d}]".format(int(confusion_matrix[1][0]), int(confusion_matrix[1][1])))


    """
    Calculates statistical measures for each image in target_data 
    Aggregates confusion matrices and statistical measures
    """
    def statistical_analysis(self, target_data, prediction_data, verbose=False):

        if verbose:
            print("Target data: "+str(len(target_data)))
            print("Prediction data: "+str(len(prediction_data)))


        #calculates confusion matrix
        conf_matrices = self.calculate_confusion_matrices(target_data, prediction_data)


        agg_conf_matrices = np.zeros(conf_matrices[0].shape)
        all_stats = []
        for x in range(0, len(conf_matrices)):
            conf_matrix = conf_matrices[x]
            
            stats = self.calculate_statistical_measures(conf_matrix)

            if verbose:
                print("Confusion matrix "+str(x)+": ")
                print(conf_matrix)
                self.print_statistical_measures(stats)

            agg_conf_matrices += conf_matrix
            all_stats.append(stats)


        agg_stats = self.calculate_statistical_measures(agg_conf_matrices)

        if verbose:
            print("Aggregate confusion matrix: ")
            print(agg_conf_matrices)
            self.print_statistical_measures(agg_stats)


        average_stats = {}
        #iterates through all statistical metrics
        for stat in all_stats[0]:
            average_stats[stat] = 0

            #iterates through all confusion matrices' states
            for x in range(0, len(all_stats)):
                try:
                    average_stats[stat] += all_stats[x][stat]
                except Exception as error:
                    continue

            average_stats[stat] /= len(all_stats)

        if verbose:
            print()
            print()
            print("Average stats: ")
            self.print_statistical_measures(average_stats)


        return (all_stats, agg_stats)


    """
    predicts on the dataset, and prints a confusion matrix of the results

    Returns a 2 item tuple where 0th item is all stats, and 1st item is aggregate stats
    """
    def prediction_analysis(self, classifier, feature_dataset, full_label_dataset, batch_size=1, verbose=False):
        generator = self.create_data_generator(feature_dataset, full_label_dataset, batch_size, "test")

        print("Predicting...")
        preds = classifier.predict_generator(generator, steps=int(len(feature_dataset)/batch_size))

        try:
            print("Feature dataset: "+str(feature_dataset.shape))
            print("predictions: "+str(preds.shape))
        except Exception as ex:
            pass

        #gets actual labels
        X_images, y_non_category = generator.get_processed_images(start=0, end=len(feature_dataset))
        #gets predicted labels
        y_predict_non_category = [ t>0.5 for t in preds]

        return self.statistical_analysis(y_non_category, y_predict_non_category, verbose)


    """
    Ensemble prediction for multi-class classification
    Returns weighted predicted determined by the weight of the model making those predictions
    params: 
        models are a list of keras models
        weights are a 2D list of lists of weights
        X_test is a single test dataset
    """
    def ensemble_predictions(self, models, weights, X_test):

        # make predictions
        predictions = []
        for model in models:
            generator = self.create_data_generator(X_test, [], 1, "test")
            preds = model.predict_generator(generator, steps=len(X_test))
            predictions.append(preds)

        predictions = np.array(predictions)

        # weighted sum of all predictions
        summed = np.tensordot(predictions, weights, axes=((0),(0)))

        # argmax across classes
        # result = np.argmax(summed, axis=1)
        # result = summed/len(models)
        result = summed
        
        return result


    """
    Loss function for optimization process, designed to be minimized
    Should be used in differential evolution algorithm
    """
    def weighted_averaging_loss_function(self, weights, models, X_test, Y_test):
        # normalize weights
        normalized_weights = self.normalize(weights)
        # calculate error rate
        error_rate = 1.0 - self.evaluate_ensemble(models, normalized_weights, X_test, Y_test)
        return error_rate


    """
    normalize a vector to have unit norm
    """
    def normalize(self, weights):
        #calculate l1 vector norm
        result = np.linalg.norm(weights, 1)

        #prevents division by zero
        if result == 0.0:
            return weights

        #returns normalized vector
        return weights / result


    """
    Evaluates a specific number of models in a weighted ensemble
    """
    def evaluate_ensemble(self, models, weights, X_validate, y_validate):
        """
        Returns the accuracy of the weighted ensemble on the validation data.

        The weighted ensemble predictions are thresholded at 0.5 and compared with
        y_validate; the weights and the resulting accuracy are printed.
        """
        weighted_predictions = self.ensemble_predictions(models, weights, X_validate)

        expected_labels = np.array(y_validate.copy())
        weighted_predictions = np.array(weighted_predictions)

        #converts to binary
        binary_predictions = [ value>0.5 for value in weighted_predictions]

        #determines accuracy of the predictions
        ensemble_accuracy = accuracy_score(expected_labels, binary_predictions)
        print("Weights: "+str(weights)+" | Accuracy: "+str(ensemble_accuracy))
        return ensemble_accuracy


    """
    Performs weight optimization to find the optimal weights for each model to optimize performance on the provided validation dataset
    """
    def get_optimal_weights(self, models, X_validate, Y_validate):
        #averaging ensemble (equal weights)
        initial_weights = [1.0/len(models) for weight in range(len(models))]
        score = self.evaluate_ensemble(models, initial_weights, X_validate, Y_validate)
        print('Equal Weights Score: %.3f' % score)


        # define bounds on each weight
        weight_bounds = [(0.0, 1.0) for model in range(len(models))]
        # arguments to the loss function
        search_arg = (models, X_validate, Y_validate)

        #Performs an optimization function in regards to the provided loss function to get optimal weights
        print("Performing Differential Evolution to calculate optimal weights")
        result = differential_evolution(func = self.weighted_averaging_loss_function, 
                                        bounds = weight_bounds, 
                                        args = search_arg, 
                                        maxiter = 1, #standard could be 1000
                                        tol = 1e-7,
                                        disp = True)

        # get the chosen weights
        weights = self.normalize(result['x'])
        print('Optimized Weights: %s' % weights)


        # evaluate chosen weights
        score = self.evaluate_ensemble(models, weights, X_validate, Y_validate)
        print('Optimized Weights Score: %.3f' % score)

        return weights


    """
    Uses a pre-trained model on similar radiographs or data, and uses it as a starting point for this model. 
    This allows for features already learned to be a starting point, and for hidden layer weights to be the initial weights. 
    Transfer learning benefits by having much better generalization, meaning less standard deviation, and higher accuracy overall. 
    """
    def transfer_learning(self):
        """
        Placeholder for transfer learning; not implemented yet, always returns None.
        """
        return None


    """
    Iterates through many combinations of hyperparameters and returns the best performing model along with its hyperparameters
    Used to determine best hyperparameters instead of manually manipulation
    """
    def grid_search(self):
        """
        Placeholder for the hyperparameter grid search; it only creates an empty
        local hyperparameter dict and returns None.
        """
        hyperparameters = dict()
        return None


    """
    A resampling technique used to estimate statistics on a population by sampling a dataset with replacement.
    Also known as Bootstrapping or Bootstrap Aggregation
    Can keep adding ensemble members since bagging does not overfit
    https://machinelearningmastery.com/a-gentle-introduction-to-the-bootstrap-method/
    """
    def bagging(self, num_models = 1, **train_args):
        """
        Trains num_models models, each on a bootstrap sample of the processed image paths.

        train_args: arguments forwarded to self.train; 'dataset_size' and 'balanced' are
                    also used here to load the image paths, and 'X' and 'Y' are overwritten
                    for every model.

        Every model is trained on a sample drawn with replacement (80% of the dataset size)
        and validated on the paths that were not drawn for it.

        Returns (classifiers, X_trains, X_validates, X_tests, Ys), one entry per model.
        """
        print("Train arguments: "+str(train_args))
        dataset_size = train_args['dataset_size']
        X = self.get_processed_image_paths(balanced=train_args['balanced'], max_num=dataset_size)
        Y = self.data_handler.read_train_labels() #don't limit, because will use this for finding masks to train_dicom_paths

        print("Dataset size: "+str(dataset_size))
        print("num models: "+str(num_models))
        print()

        #list of indices running the length of X
        indices = list(range(len(X)))

        classifiers = []
        X_trains = []
        X_validates = []
        X_tests = []
        Ys = []
        Y_validates = []
        for section in range(0, num_models):

            ## Performs the resampling with replacement ##
            train_indices = resample(indices, replace=True, n_samples=int(len(indices)*0.8))

            #indices never drawn form the validation set; a set keeps the membership test cheap
            drawn_indices = set(train_indices)
            validation_indices = [x for x in indices if x not in drawn_indices]

            # select data
            trainX = [X[x] for x in train_indices]
            validationX = [X[x] for x in validation_indices]

            print("Train X len: "+str(len(trainX)))
            print("Validate X len: "+str(len(validationX)))

            train_args['X'] = trainX
            train_args['Y'] = Y

            classifier, X_train_section, X_validate_section, X_test_section, Y_section = self.train(**train_args)
            classifiers.append(classifier)
            X_trains.append(X_train_section)
            #the out-of-bag paths are kept as validation data, not the split returned by train
            X_validates.append(validationX)
            X_tests.append(X_test_section)
            Ys.append(Y_section)

            #gets output validation data
            generator = self.create_data_generator(validationX, Y, len(validationX), "test")
            X_images, y_non_category = generator.get_processed_images(start=0, end=len(validationX))
            Y_validates.append(y_non_category)

            print("Len X_Validate: "+str(len(validationX)))
            print("Len Y_validate: "+str(len(y_non_category)))
            print()

            #prints performance on the validation dataset
            self.prediction_analysis(classifier, validationX, Y, batch_size=1, verbose=True)

        #NOTE: no ensemble weights are computed here, only the per-model results are returned
        return classifiers, X_trains, X_validates, X_tests, Ys


    """
    Creates an ensemble from the models contained in the training history of a single model's training session 
    Useful if there's high variance during the model training, or if training multiple models 
    in other ensemble methods is infeasible due to the model's size and training timeframe. 
    """
    def horizontal_voting_ensemble(self, num_models = 1, **train_args):
        """
        Placeholder for the horizontal voting ensemble; not implemented yet, always returns None.
        """
        return None


    """
    Snapshot ensemble involves using an aggressive learning rate during training to get a 
    diverse collection of models to ensemble during a training session
    The aggressive learning rate allows for models in the same training session over close epochs to not be so similar to each other
    Useful for deep learning where the computation cost of training is extremely high
    """
    def snapshot_ensemble(self):
        """
        Placeholder for the snapshot ensemble; not implemented yet, always returns None.
        """
        return None


    """
    Incorporates the technique of model-averaging ensembling, which is the process of training multiple of the same neural networks on the same training set, 
    then averaging their predictions. 
    This ensembling method can also be weighted, where different models have different weights depending on their performing on a validation dataset
    """
    def weighted_model_averaging(self, num_models = 1, **train_args):
        print("Train arguments: "+str(train_args))
        dataset_size = train_args['dataset_size']
        X = self.get_processed_image_paths(balanced=train_args['balanced'], max_num=dataset_size)
        Y = self.data_handler.read_train_labels() #don't limit, because will use this for finding masks to train_dicom_paths

        print("Dataset size: "+str(dataset_size))
        print("num models: "+str(num_models))
        print()


        classifiers = []
        X_trains = []
        X_validates = []
        X_tests = []
        Ys = []
        Y_validates = []
        results = []
        for section in range(0, num_models):
            train_args['X'] = X
            train_args['Y'] = Y

            classifier, X_train_section, X_validate_section, X_test_section, Y_section = self.train(**train_args)
            classifiers.append(classifier)
            X_trains.append(X_train_section)
            X_validates.append(X_validate_section)
            X_tests.append(X_test_section)
            Ys.append(Y_section)

            #gets output validation data
            generator = self.create_data_generator(X_validate_section, Y, len(X_validate_section), "test")
            X_images, y_non_category = generator.get_processed_images(start=0, end=len(X_validate_section))
            Y_validates.append(y_non_category)

            print("Len X_Validate: "+str(len(X_validate_section)))
            print("Len Y_validate: "+str(len(y_non_category)))
            print()

            #prints performance on the validation dataset
            self.prediction_analysis(classifier, X_validates[-1], Y, batch_size=1, verbose=True)


        print("-- Start Weight Optimization --")
        weights = self.get_optimal_weights(classifiers, X_validates[0], Y_validates[0])
        # weights = [0.39759092, 0.13496959, 0.46743949] #debugging
        print("-- End of Weight Optimization --")


        #also returns the optimal weights
        return classifiers, X_trains, X_validates, X_tests, Ys, weights


    """
    takes a dataset, splits into n_splits+1 sections, then split each of those into train and test sections, 
    then trains a model on each section and ensembles them together to hopefully have one better model that's more stable
    than each model together
    https://www.sciencedirect.com/science/article/pii/S0925231214007644

    Used as an ensemble since a bunch of smaller models might be able to predict better than a large model. 

    """
    # *args are the important arguments for calling train
    def resampling_ensemble(self, n_splits = 0, **train_args):
        """
        Trains one model per contiguous section of the dataset, then runs prediction analysis 
        on each model's validation portion.

        n_splits: number of cuts made in the dataset, so n_splits+1 models are trained (0 trains a single model)
        train_args: keyword arguments forwarded to train(). Must contain 'dataset_size', 'balanced' and 'batch_size'

        returns (classifiers, X_trains, X_validates, X_tests, Ys), with one entry per section that was trained successfully
        """
        dataset_size = train_args['dataset_size']
        X = self.get_processed_image_paths(balanced=train_args['balanced'], max_num=dataset_size)
        Y = self.data_handler.read_train_labels() #don't limit, because will use this for finding masks to train_dicom_paths

        num_sections = n_splits+1

        print("Dataset size: "+str(dataset_size))
        print("n_splits: "+str(n_splits))

        #fewer images than requested may have been retrieved, so sections are sized from what is actually available. 
        #Sizing from dataset_size alone would leave the trailing sections short or empty.
        section_size = min(dataset_size, len(X)) // num_sections

        print("Section size: "+str(section_size))
        print()


        classifiers = []
        X_trains = []
        X_validates = []
        X_tests = []
        Ys = []
        for section in range(num_sections):
            print("Section: "+str(section+1)+"/"+str(num_sections))
            start = section*section_size
            end = start+section_size

            print("Start: "+str(start)+" : "+str(end))

            #trains on this section
            train_args['X'] = X[start:end]
            train_args['Y'] = Y

            outcome = self.train(**train_args)

            #a missing result or a None classifier means nothing was trained, so there is nothing to analyse
            if outcome is None or outcome[0] is None:
                print("Skipping section "+str(section+1)+", no model was trained")
                continue

            classifier, X_train_section, X_validate_section, X_test_section, Y_section = outcome
            classifiers.append(classifier)
            X_trains.append(X_train_section)
            X_validates.append(X_validate_section)
            X_tests.append(X_test_section)
            Ys.append(Y_section)


            #performs prediction analysis on results (the return value isn't needed here)
            self.prediction_analysis(classifier=classifier, 
                                    feature_dataset=X_validate_section, 
                                    full_label_dataset=Y_section, 
                                    batch_size=train_args['batch_size'])


        return classifiers, X_trains, X_validates, X_tests, Ys


    """
    takes a dataset, gets k_folds so that 0.8 of the dataset is for training, 0.2 is for testing, and this portion moves 
    throughout the dataset so that by the end, each portion of the dataset got a chance to be the test portion. 
    https://en.wikipedia.org/wiki/Cross-validation_(statistics)

    Used to judge performance of a model arch on a dataset

    """
    def kfold_cross_validation(self, k_folds = 0, **train_args):
        """
        Trains one model per fold of a shuffled K-fold split and analyses each on its validation portion.

        k_folds: number of folds, must be at least 2
        train_args: keyword arguments forwarded to train(). Must contain 'dataset_size', 'balanced' and 'batch_size'

        returns (classifiers, X_trains, X_validates, X_tests, Ys) with one entry per trained fold, 
        or five Nones when k_folds is invalid

        NOTE: the held-out indices of each fold are only reported. train() receives the fold's training 
        indices and makes its own train/validation/test split of them.
        """

        if k_folds<2:
            print("Error, K-folds must have at least 2 folds. Please change hyperparameters and reflect that. ")
            return None, None, None, None, None

        print("Train arguments: "+str(train_args))
        dataset_size = train_args['dataset_size']
        X = self.get_processed_image_paths(balanced=train_args['balanced'], max_num=dataset_size)
        Y = self.data_handler.read_train_labels() #don't limit, because will use this for finding masks to train_dicom_paths

        print("Total Feature size: "+str(len(X)))


        #fixed seed so the folds are the same on every run
        seed = 12345

        #creates sklearn KFold object
        kfold = KFold(n_splits=k_folds, shuffle=True, random_state=seed)


        classifiers = []
        X_trains = []
        X_validates = []
        X_tests = []
        Ys = []
        for fold_index, (train_indices, test_indices) in enumerate(kfold.split(X), start=1):
            print()
            print("Split "+str(fold_index)+"/"+str(k_folds))
            print("Split Train size: "+str(len(train_indices)))
            print("Split Test size: "+str(len(test_indices)))

            #picks this fold's training items, kept as a plain list to be compatible with the train method
            train_args['X'] = [X[index] for index in train_indices]
            train_args['Y'] = Y


            #Be careful of using early stopping while performing k-fold cross validation
            outcome = self.train(**train_args)

            #a missing result or a None classifier means nothing was trained, so there is nothing to analyse
            if outcome is None or outcome[0] is None:
                print("Skipping split "+str(fold_index)+", no model was trained")
                continue

            classifier, X_train, X_validate, X_test, Y_section = outcome

            classifiers.append(classifier)
            X_trains.append(X_train)
            X_validates.append(X_validate)
            X_tests.append(X_test)
            Ys.append(Y_section)


            #performs prediction analysis on this fold's validation portion
            #(previously referenced an undefined name and raised NameError)
            self.prediction_analysis(classifier=classifier, 
                                    feature_dataset=X_validate, 
                                    full_label_dataset=Y, 
                                    batch_size=train_args['batch_size'])


        return classifiers, X_trains, X_validates, X_tests, Ys


    """ 
    Stacked ensemble is an ensemble technique where instead of using linear regression, a neural network is used to calculate 
    optimal weights in a weighted average ensemble.
    """
    def stacked_ensemble(self, **train_args):
        """
        Placeholder for the stacked ensemble training technique. Not implemented yet: 
        accepts arbitrary keyword arguments (presumably those of train(), to be confirmed) and does nothing.
        """
        return None


    """
    Training technique for not-so-stable models where the weights of the models from the last few epochs of training are averaged, 
    and the final model uses those average weights
    """
    def polyak_ruppert_averaging(self):
        """
        Placeholder for Polyak-Ruppert weight averaging. Not implemented yet, does nothing.
        The commented sketch below outlines the intended approach.
        """
        # # create a model from the weights of multiple models
        # def model_weight_ensemble(members, weights):
        #     # determine how many layers need to be averaged
        #     n_layers = len(members[0].get_weights())
        #     # create a set of average model weights
        #     avg_model_weights = list()
        #     for layer in range(n_layers):
        #         # collect this layer from each model
        #         layer_weights = array([model.get_weights()[layer] for model in members])
        #         # weighted average of weights for this layer
        #         avg_layer_weights = average(layer_weights, axis=0, weights=weights)
        #         # store average layer weights
        #         avg_model_weights.append(avg_layer_weights)
        #     # create a new model with the same structure
        #     model = clone_model(members[0])
        #     # set the weights in the new model
        #     model.set_weights(avg_model_weights)
        #     model.compile(loss='categorical_crossentropy', optimizer='adam', metrics=['accuracy'])
        #     return model

        return None


    """
    trains model with model_arch architecture
    returns the Keras model, training dataset, validation dataset, testing dataset, and all labels
    """
    # @abstractmethod
    def train(self, model_arch="cnn", dataset_size=100, balanced=False, X=None, Y=None, train_ratio=0.7, val_ratio=0.2, batch_size=1, epochs=1):
        """
        Trains a model with the model_arch architecture ("cnn" or "unet", case-insensitive).

        X: feature dataset, loaded with get_processed_image_paths() when None
        Y: label dataset, loaded with read_train_labels() when None
        train_ratio, val_ratio: passed to data_handler.split_data() to split X
        batch_size, epochs: passed to the data generators and to fit_generator()

        returns (classifier, X_train, X_validate, X_test, Y). All five are None when there is 
        no training data or the architecture is unsupported, so callers can always unpack five values.

        The model returned is the best checkpoint (lowest val_loss) reloaded from ./trained_models/
        """

        #load features and targets if they aren't provided
        if X is None:
            X = self.get_processed_image_paths(balanced=balanced, max_num=dataset_size)
        if Y is None:
            Y = self.data_handler.read_train_labels() #don't limit, because will use this for finding masks to train_dicom_paths


        #splits into training, validation, and test datasets
        X_train, X_validate, X_test = self.data_handler.split_data(X, train_ratio, val_ratio)

        #stops if no data to train on
        if len(X_train)==0:
            return None, None, None, None, None

        print("X_train size: "+str(len(X_train)))
        print("X_validate size: "+str(len(X_validate)))

        #creates the proper specified architecture
        arch = model_arch.lower()
        if arch == "cnn": 
            classifier = self.create_CNN()  
        elif arch == "unet":
            classifier = self.create_Unet()
        else:
            print("Unsupported specified model type")
            #same shape as the other failure return, a bare return would break callers that unpack
            return None, None, None, None, None


        training_generator = self.create_data_generator(X_train, Y, batch_size, "train")
        validation_generator = self.create_data_generator(X_validate, Y, batch_size, "test")

        best_model_path = "./trained_models/"+str(self.get_model_arch_filename_prefix(model_arch))+"_model.h5"


        ## Create callbacks 
        # patient early stopping
        try:
            early_stopping = EarlyStopping(monitor='val_loss', mode='min', verbose=1, patience=5, restore_best_weights=False)
        except TypeError:
            #keras version is < 2.2.3, so don't include "restore_best_weights" parameter
            early_stopping = EarlyStopping(monitor='val_loss', mode='min', verbose=1, patience=5)

        model_checkpoint = ModelCheckpoint(best_model_path, monitor='val_loss', mode='min', save_best_only=True, save_weights_only=False, period=1, verbose=0)
        callback_list = [early_stopping, model_checkpoint]


        #both step counts are in batches: enough batches to cover each dataset once
        train_steps = int(np.ceil(len(X_train) / batch_size))
        validation_steps = int(np.ceil(len(X_validate) / batch_size))

        # fits the model on batches with real-time data augmentation:
        classifier.fit_generator(generator=training_generator,
                                steps_per_epoch=train_steps,
                                epochs=epochs,
                                validation_data=validation_generator,
                                validation_steps=validation_steps, 
                                callbacks = callback_list)

        #loads the best model. The custom objects are needed when the model was compiled with the dice loss, 
        #and match the ones test_model() passes
        classifier = load_model(best_model_path, 
                                custom_objects = {'dice_coef_loss': self.dice_coef_loss, 
                                                    'dice_coef': self.dice_coef}
                                )

        return classifier, X_train, X_validate, X_test, Y


    """
    trains binary classifier with specified hyperparameters, then evaluates the results and saves to disk
    """
    @abstractmethod
    def train_evaluate(self, classification_type="", model_arch="cnn", training_type="regular"):
        """
        Trains model(s) with the hyperparameters stored for classification_type/model_arch, 
        runs prediction analysis on the training and validation portions, then saves the session to disk.

        classification_type: top-level hyperparameter key (e.g. "binary"), also used when saving the session
        model_arch: second-level hyperparameter key (e.g. "cnn")
        training_type: "regular", "resampling_ensemble", "kfold_cross_validation", 
                       "weighted_model_averaging" or "bagging" (case-insensitive)

        returns None. Prints a message and stops early if the training type is unknown or training produced nothing.
        """
        #loads hyperparameters because they might have been changed in the main menu
        self.hyperparameters = self.data_handler.load_hyperparameters()
        hp = self.hyperparameters[classification_type][model_arch]

        batch_size = hp['batch_size']

        params = {"model_arch": model_arch, 
                    "dataset_size": hp['dataset_size'], 
                    "balanced": hp['balanced'],
                    "train_ratio": hp['train_ratio'],
                    "val_ratio": hp['val_ratio'], 
                    "batch_size": batch_size, 
                    "epochs": hp['epochs']}

        periphery = {}
        mode = training_type.lower()

        if mode == "regular":
            #a regular run is a resampling ensemble with a single section
            classifiers, X_trains, X_validates, X_tests, Ys = self.resampling_ensemble(n_splits = 0, **params)

        elif mode == "resampling_ensemble":
            classifiers, X_trains, X_validates, X_tests, Ys = self.resampling_ensemble(n_splits = hp['resampling_ensemble_n_splits'], **params)

        elif mode == "kfold_cross_validation":
            classifiers, X_trains, X_validates, X_tests, Ys = self.kfold_cross_validation(k_folds = hp['kfold_cross_validation_k_folds'], **params)

        elif mode == "weighted_model_averaging":
            classifiers, X_trains, X_validates, X_tests, Ys, opt_weights = self.weighted_model_averaging(num_models = hp['weighted_avg_ensemble_num_models'], **params)
            periphery['optimal_weights'] = opt_weights

        elif mode == "bagging":
            classifiers, X_trains, X_validates, X_tests, Ys = self.bagging(num_models=hp['bagging_num_models'], **params)

        else:
            #unpacking None into five names would raise TypeError, so report and stop instead
            print("Unsupported training type: "+str(training_type))
            return


        if classifiers is None:
            print("Something went wrong in train_evaluate()")
            return


        #runs prediction analysis for every trained model on the matching feature set. 
        #Best effort: a failure is reported and whatever was collected so far is kept.
        def analyse(heading, portion_name, feature_sets):
            print()
            print(heading)
            analysis = []
            try:
                for i in range(0, len(classifiers)):
                    analysis.append(self.prediction_analysis(classifier=classifiers[i], 
                                                            feature_dataset=feature_sets[i], 
                                                            full_label_dataset=Ys[i], 
                                                            batch_size=batch_size))
            except Exception as error:
                print("Couldn't perform "+portion_name+" prediction analysis.")
                print(error)
            return analysis


        #performs prediction on training portion
        training_prediction_analysis = analyse("--Training prediction analysis--", "training", X_trains)

        #perform prediction on validation portion
        validation_prediction_analysis = analyse("--Validation prediction analysis--", "validation", X_validates)


        #saved under the classification type that was actually trained (this used to be hard-coded to "binary")
        self.save_training_session(classification_type, training_type, classifiers, model_arch, training_prediction_analysis, validation_prediction_analysis, periphery)


    """
    saves training session, like the trained model, hyperparameters, and results, for future review
    """
    def save_training_session(self, classification_type, training_type, classifiers, model_arch, training_analysis, validation_analysis, periphery_data=None):
        """
        Saves a training session (models, hyperparameters, prediction analysis) into a new session folder.

        classifiers: list of trained models, each saved as its own .h5 file
        training_analysis, validation_analysis: lists where each entry holds the individual stats 
                                                at index 0 and the aggregate stats at index 1
        periphery_data: optional extra data, written to periphery_data.json unless None
        """

        session_dir = self.data_handler.create_new_training_session_dir(project=self.project, classification_type=classification_type, model_arch=model_arch)

        num_models = len(classifiers)

        #saves models. Each one is attempted on its own so a single failure doesn't stop the rest from being saved
        for index, classifier in enumerate(classifiers, start=1):
            try:
                classifier.save(session_dir+"/"+str(self.get_model_arch_filename_prefix(model_arch))+"_"+str(training_type)+"_model_"+str(index)+"_of_"+str(num_models)+".h5")
            except Exception as error:
                print("Error, couldn't save model: "+str(error))

        #prints model training history (best effort, a model without usable history is only reported)
        try:
            for classifier in classifiers:
                accuracy_history = classifier.history['acc']
                loss_history = classifier.history['loss']

                print("accuracy history: "+str(accuracy_history))
                print("Loss history: "+str(loss_history))
        except Exception as error:
            print("Couldn't get model training stats history: "+str(error))

        #saves hyperparameters
        new_hyperparameter_path = session_dir+"/hyperparameters.json"
        self.data_handler.copy_hyperparameters(new_hyperparameter_path)

        #Saves training prediction analysis
        for index, analysis in enumerate(training_analysis, start=1):
            to_save = {"all_stats": analysis[0], "agg_stats": analysis[1]}
            self.data_handler.save_to_json(session_dir+"/train_stats_"+str(index)+"_of_"+str(len(training_analysis))+".json", to_save)


        #Saves Validation prediction analysis, numbered against its own total (it used the training total before)
        for index, analysis in enumerate(validation_analysis, start=1):
            to_save = {'all_stats': analysis[0], 'agg_stats': analysis[1]}
            self.data_handler.save_to_json(session_dir+"/validation_stats_"+str(index)+"_of_"+str(len(validation_analysis))+".json", to_save)

        #Saves Periphery data
        if periphery_data is not None:
            self.data_handler.save_to_json(session_dir+"/periphery_data.json", periphery_data)


    """
    Reads training session results saved under ./training_sessions folder, then displays data in readable and logical manner
    """
    @abstractmethod
    def view_training_session_results(self, project, classifier_type, model_arch, date, session_num):
        """
        Prints the contents of a saved training session: the file list, the hyperparameters, 
        the saved models, the training/validation stats and any periphery data.

        date: datetime of the session, formatted as YYYY-MM-DD to locate the session folder
        Returns without printing results when the session folder doesn't exist.
        """
        print()

        session_path = self.data_handler.get_training_session_path(project=project, 
                                                                    classification_type=classifier_type, 
                                                                    model_arch=model_arch, 
                                                                    date=datetime.strftime(date, "%Y-%m-%d"), 
                                                                    training_session_num=session_num)

        #nothing to show when the session folder is missing
        if not os.path.exists(session_path):
            return

        entries = os.listdir(session_path)

        #lists everything stored in the session folder
        for entry in entries:
            print(entry)
        print()

        ## hyperparameters the session was trained with
        print("-- hyperparameters corresponding to "+str(classifier_type)+" classifier with "+str(model_arch)+" model architecture ")
        session_hyperparameters = self.data_handler.load_hyperparameters(session_path+"/hyperparameters.json")
        self.data_handler.print_hyperparameters(session_hyperparameters[classifier_type][model_arch])
        print()

        print()
        print("Saved models: ")
        for entry in entries:
            if ".h5" in entry:
                print(entry)
        print()
        print()


        #prints the aggregate stats of one stats file, plus the individual stats when there is more than one
        def show_stats(filename):
            print("#"+str(filename).replace(".json", "")) #prints filename
            contents = self.data_handler.load_json(session_path+"/"+filename)

            print("Aggregate stats: ")
            self.print_statistical_measures(contents['agg_stats'])

            individual = contents['all_stats']
            if len(individual)>1:
                print()
                print()
                print("Individual stats:")
                for stats in individual:
                    self.print_statistical_measures(stats)
                    print()


        ## Training results first, then validation results, each picked out by its filename marker
        sections = (("-- Training Results --", "train_stats"), 
                    ("-- Validation Results --", "validation_stats"))
        for heading, marker in sections:
            print()
            print(heading)
            for entry in entries:
                if marker in entry:
                    show_stats(entry)
                    print()
            print()


        ## Periphery data, if the session saved any
        for entry in entries:
            if "periphery_data" in entry:
                print()
                print("-- Periphery Data --")
                self.data_handler.print_json(self.data_handler.load_json(session_path+"/"+entry))


    """
    Takes in the file path to a saved h5 model, 
    then returns results from the model's predictions on a portion of the test dataset
    """
    def test_model(self, model_path="", dataset_size=100, verbose=False, batch_size=5):
        """
        Loads the saved h5 model at model_path and runs prediction analysis on a portion of the test dataset.

        dataset_size: maximum number of test images to retrieve
        verbose: passed through to prediction_analysis()
        batch_size: batch size used for the prediction analysis (defaults to the previously hard-coded 5)

        returns the result of prediction_analysis(), or an empty dict when the model couldn't be loaded
        """
        X = self.get_processed_image_paths(dataset_type="test", balanced=False, max_num=dataset_size)
        #reads train labels, because the "test" dataset was part of the train dataset
        Y = self.data_handler.read_train_labels() #don't limit, because will use this for finding masks to train_dicom_paths

        print("Retrieved processed image paths: "+str(len(X)))

        #loads the model, the custom objects are needed for models compiled with the dice loss/metric
        try:
            classifier = load_model(model_path, 
                                    custom_objects = {'dice_coef_loss': self.dice_coef_loss, 
                                                        'dice_coef': self.dice_coef}
                                    )
        except Exception as error:
            print(error)
            print("Model doesn't exist for "+str(model_path))
            return {}


        #performs statistical analysis and returns the result
        return self.prediction_analysis(classifier=classifier, 
                                        feature_dataset=X, 
                                        full_label_dataset=Y, 
                                        batch_size=batch_size, 
                                        verbose=verbose)


    """
    performs predictions and subsequent statistic calculations on unofficial test dataset
    """
    @abstractmethod
    def test(self, project, classification_type, model_arch, date_to_retrieve, training_session_num, dataset_size):

        training_session_path = self.data_handler.get_training_session_path(project, classification_type, model_arch, date_to_retrieve, training_session_num)

        file_list = os.listdir(training_session_path)


        model_paths = []
        statistical_results = []


        for file in file_list:
            if ".h5" in file:
                model_path = training_session_path+"/"+file
                print("Model path: "+str(model_path))
                model_paths.append(model_path)

                stat_results = self.test_model(model_path=model_path, dataset_size=dataset_size, verbose=False)

                statistical_results.append(stat_results)
        print()
        print()


        print("-- Results --")
        for x in range(0, len(statistical_results)):
            print("Model "+str(model_paths[x]))
            self.print_statistical_measures(statistical_results[x][0][0])

        print()


"""

Handles binary classification training, validation, and testing

"""
class BinaryClassifier(Classifier):
    """
    Classifier specialised for binary labels: builds the binary CNN and U-net models, 
    the binary data generator, and forwards to the base class with "binary" as the classification type.
    """
    def __init__(self, project):
        super().__init__(project)

    """
    creates CNN sculpted for binary classification
    """
    def create_CNN(self):
        """
        Builds and compiles a Sequential CNN from the ['binary']['cnn'] hyperparameters: 
        num_conv_layers convolution stages, then a dense layer and a single-unit output.
        """
        hp = self.hyperparameters['binary']['cnn']

        CNN_size = hp['conv_layer_size']
        num_conv_layers = hp['num_conv_layers']
        pool_size = (hp['pool_size'], hp['pool_size'])
        filter_size = (hp['filter_size'], hp['filter_size'])
        CNN_activation = hp['conv_activation']
        dense_activation = hp['dense_activation']
        output_activation = hp['output_activation']
        loss = hp['loss']
        optimizer = hp['optimizer']
        last_layer_size = hp['last_layer_size']
        dropout = hp['dropout']
        weight_regularization = hp['weight_regularization']
        activation_regularization = hp['activation_regularization']
        weight_limit = hp['weight_limit']
        noise_amount = hp['noise_std']
        batch_normalization = hp['batch_normalization']

        #the dice loss is a method of this class, so the name is swapped for the callable
        if loss=="dice_coef_loss":
            loss = self.dice_coef_loss

        metrics = "accuracy"
        # metrics = self.dice_coef


        classifier = Sequential()


        #adds one convolution stage: convolution, activation, optional batch normalization, pooling, 
        #optional noise, and dropout when batch normalization isn't used.
        #conv_kwargs carries the extra Conv2D arguments, used to give the first stage its input shape
        def add_conv_stage(**conv_kwargs):
            classifier.add(Conv2D(CNN_size, filter_size, 
                                padding="same", 
                                kernel_initializer='he_uniform', #Initializes weights
                                kernel_regularizer=l2(weight_regularization), #regularizes weights to avoid overfitting
                                activity_regularizer=l1(activation_regularization), #regularizes activation to avoid overfitting
                                kernel_constraint=max_norm(weight_limit), #constrains weights to avoid exploding gradients
                                **conv_kwargs))
            classifier.add(Activation(CNN_activation))

            if batch_normalization:
                classifier.add(BatchNormalization())

            #pooling slides a pool_size grid over the feature maps and keeps the largest value of each window
            classifier.add(MaxPooling2D(pool_size = pool_size))

            if noise_amount>0:
                classifier.add(GaussianNoise(noise_amount)) #Adds noise

            #add dropout if not using batch normalization
            if not batch_normalization:
                classifier.add(Dropout(dropout))


        #first stage declares the input shape (single channel images)
        add_conv_stage(input_shape = (self.image_width, self.image_height, 1))

        #adds hidden convolutional layers
        for _ in range(1, num_conv_layers):
            add_conv_stage()


        #flattens the layers
        classifier.add(Flatten())

        #last_layer_size can be decreased to lower computation time, and increased for better accuracy
        classifier.add(Dense(units = last_layer_size, activation = dense_activation))
        if not batch_normalization:
            classifier.add(Dropout(dropout))

        classifier.add(Dense(units = 1, activation = output_activation))

        classifier.compile(optimizer = optimizer, loss = loss, metrics = [metrics])

        print("Creating CNN")
        classifier.summary()

        return classifier


    """
    creates and returns U-net architecture model
    """
    def create_Unet(self):
        """
        Builds and compiles a U-net style model from the ['binary']['unet'] hyperparameters, 
        finished with dense layers and a single-unit output for binary classification.
        """
        hp = self.hyperparameters['binary']['unet']

        start_size = hp['start_size']
        pool_size = (hp['pool_size'], hp['pool_size'])
        filter_size = (hp['filter_size'], hp['filter_size'])
        conv_activation = hp['conv_activation']
        dense_activation = hp['dense_activation']
        output_activation = hp['output_activation']
        loss = hp['loss']
        optimizer = hp['optimizer']
        last_layer_size = hp['last_layer_size']
        batch_normalization = hp['batch_normalization']
        depth = hp['depth']

        dropout = hp['dropout']
        weight_regularization = hp['weight_regularization']
        activation_regularization = hp['activation_regularization']
        weight_limit = hp['weight_limit']


        #the dice loss is a method of this class, so the name is swapped for the callable
        if loss=="dice_coef_loss":
            loss = self.dice_coef_loss

        #"adam" is replaced by an Adam instance with an explicit learning rate
        if optimizer=="adam":
            optimizer = Adam(lr=1e-5)


        def create_conv_layer(size):
            return Conv2D(size, 
                        filter_size, 
                        activation=conv_activation, 
                        padding='same', 
                        kernel_initializer='he_uniform', #Initializes weights
                        kernel_regularizer=l2(weight_regularization), #regularizes weights to avoid overfitting
                        activity_regularizer=l1(activation_regularization), #regularizes activation to avoid overfitting
                        kernel_constraint=max_norm(weight_limit))


        #returns tuple where 0th element is the convolutional layer, and the 1st is the pooling layer
        def create_downscale_layer(size, prev_layer):
            conv = create_conv_layer(size)(prev_layer)
            conv = create_conv_layer(size)(conv)
            if batch_normalization:
                conv = BatchNormalization()(conv)

            pool = MaxPooling2D(pool_size=pool_size)(conv)

            return conv, pool

        #returns tuple where 0th element is the convolutional layer, and the 1st is the upscale layer
        def create_upscale_layer(size, prev_layer, level_layer):
            #upsamples the previous layer, then joins it with the downscale layer of the same level (skip connection)
            upsampled = Conv2D(size, pool_size, activation=conv_activation, padding='same')(UpSampling2D(size=pool_size)(prev_layer))
            up = concatenate([upsampled, level_layer], axis=3)
            conv = create_conv_layer(size)(up)
            conv = create_conv_layer(size)(conv)
            if batch_normalization:
                conv = BatchNormalization()(conv)

            return conv, up


        inputs = Input((self.image_width, self.image_height, 1))


        downscale_layers = [] #list of tuples of downscaling layers
        upscale_layers = [] #list of tuples of upscaling layers


        downscale_layers.append((inputs,inputs)) #adds the first layer

        #If N = depth, there will be N downscaling layers and N-1 upscaling layers
        for x in range(0, depth):
            layer_size = start_size*(2**(x))
            conv, pool = create_downscale_layer(layer_size, downscale_layers[-1][1])
            downscale_layers.append((conv, pool))

        #adds initial upscale layer, which is the previous downscale layer
        upscale_layers.append(downscale_layers[-1])

        #There will be depth-1 upscaling layers, each paired with the downscale layer of the same level
        for x in range(depth-1, 0, -1):
            layer_size = start_size*(2**(x-1))
            conv, up = create_upscale_layer(layer_size, upscale_layers[-1][0], downscale_layers[x][0])
            upscale_layers.append((conv, up))


        last_conv = upscale_layers[-1][0]

        conv_1d = Convolution2D(1, (1, 1), activation=conv_activation)(last_conv)


        #flattens the layers
        dense1 = Flatten()(conv_1d)
        dense1 = Dense(units = last_layer_size, activation = dense_activation)(dense1)
        #dropout regularizes the hidden dense layer. It used to be applied after the output layer, 
        #which randomly zeroed and rescaled the prediction itself during training
        dense1 = Dropout(dropout)(dense1)
        dense2 = Dense(units = 1, activation = output_activation)(dense1)

        #joins the CNN with the dense layers
        model = Model(inputs=inputs, outputs=dense2)

        # model.compile(optimizer=Adam(lr=1e-5), loss=self.dice_coef_loss, metrics=[self.dice_coef])
        model.compile(optimizer=optimizer, loss=loss, metrics=["accuracy"])

        print("Creating u-net")
        model.summary()

        return model

    """
    creates custom data generator specific for labels of type binary
    """
    def create_data_generator(self, feature_dataset, label_dataset, batch_size, step="train"):
        """
        Returns a DataGenerator in "binary" mode over the given datasets, 
        configured with the parameters get_data_generator_params() returns for this step.
        """
        params = self.get_data_generator_params(step=step)

        return DataGenerator(feature_dataset, label_dataset, batch_size, "binary", **params)


    """
    returns list of size 1 of confusion matrix
    """
    def calculate_confusion_matrices(self, target_data, prediction_data):
        """
        Computes the confusion matrix of the predictions against the targets and returns it in a list of size 1.
        """
        conf_matrix = confusion_matrix(target_data, np.array(prediction_data))

        return [conf_matrix]


    def train_evaluate(self, model_arch="cnn", training_type="regular"):
        """Runs the base class train_evaluate() with "binary" as the classification type."""
        super().train_evaluate(classification_type="binary", model_arch=model_arch, training_type=training_type)


    def test(self, project, model_arch, date_to_retrieve, training_session_num, dataset_size):
        """Runs the base class test() with "binary" as the classification type."""
        super().test(project, "binary", model_arch, date_to_retrieve, training_session_num, dataset_size)


    def view_training_session_results(self, project, model_arch, date, session_num):
        """Runs the base class view_training_session_results() with "binary" as the classifier type."""
        super().view_training_session_results(project, "binary", model_arch, date, session_num)


"""

Handles segmentation classification training, validation, and testing

"""
class SegmentationClassifier(Classifier):
    """Classifier whose labels are per-pixel segmentation masks.

    Builds the segmentation models (plain CNN and U-net) from the
    ``'segmentation'`` section of ``self.hyperparameters`` and forwards
    training, testing and result viewing to the parent class with the
    classification type fixed to ``"segmentation"``.
    """

    def __init__(self, project):
        """Set up the shared classifier state for ``project`` via the parent class."""
        super().__init__(project)

    def create_CNN(self):
        """Build and compile a sequential CNN for segmentation.

        Every setting is read from ``self.hyperparameters['segmentation']['cnn']``.
        The network is made of at least one (and otherwise ``num_conv_layers``)
        blocks of: convolution -> activation -> optional batch normalization ->
        max pooling -> optional Gaussian noise -> dropout (only when batch
        normalization is off). A single-filter 1x1 convolution using
        ``output_activation`` is the output layer.

        The model is compiled with ``self.dice_coef`` as its metric. When the
        configured loss is the string "dice_coef_loss" it is replaced by
        ``self.dice_coef_loss``; any other loss value is handed to keras as is.

        NOTE(review): every block max-pools and nothing upsamples again, so the
        output is presumably smaller than the input image whenever pool_size > 1.
        The method prints "--- Unavailable ---" itself - confirm whether this
        architecture is meant to be usable for segmentation.

        Returns:
            The compiled keras ``Sequential`` model.
        """
        params = self.hyperparameters['segmentation']['cnn']

        CNN_size = params['conv_layer_size']
        num_conv_layers = params['num_conv_layers']
        pool_size = (params['pool_size'], params['pool_size'])
        filter_size = (params['filter_size'], params['filter_size'])
        CNN_activation = params['conv_activation']
        output_activation = params['output_activation']
        loss = params['loss']
        optimizer = params['optimizer']
        dropout = params['dropout']
        weight_regularization = params['weight_regularization']
        activation_regularization = params['activation_regularization']
        weight_limit = params['weight_limit']
        noise_amount = params['noise_std']
        batch_normalization = params['batch_normalization']

        if loss == "dice_coef_loss":
            loss = self.dice_coef_loss

        classifier = Sequential()

        def add_conv_block(**first_layer_args):
            """Append one convolution/pooling block; extra kwargs go to the Conv2D layer."""
            classifier.add(Conv2D(CNN_size, filter_size,
                                  padding="same",
                                  kernel_initializer='he_uniform',  # initializes weights
                                  kernel_regularizer=l2(weight_regularization),  # regularizes weights to avoid overfitting
                                  activity_regularizer=l1(activation_regularization),  # regularizes activations to avoid overfitting
                                  kernel_constraint=max_norm(weight_limit),  # caps the weight norm
                                  **first_layer_args))
            classifier.add(Activation(CNN_activation))

            if batch_normalization:
                classifier.add(BatchNormalization())

            classifier.add(MaxPooling2D(pool_size=pool_size))

            if noise_amount > 0:
                classifier.add(GaussianNoise(noise_amount))

            # dropout is only added when batch normalization is not used
            if not batch_normalization:
                classifier.add(Dropout(dropout))

        # The first block is always present and is the only one that declares the input shape
        add_conv_block(input_shape=(self.image_width, self.image_height, 1))

        # Remaining hidden convolutional blocks
        for _ in range(1, num_conv_layers):
            add_conv_block()

        # Output layer: one filter, 1x1 kernel
        classifier.add(Conv2D(1, (1, 1), activation=output_activation))

        classifier.compile(optimizer=optimizer, loss=loss, metrics=[self.dice_coef])

        print("Creating CNN")
        classifier.summary()

        print()
        print()
        print("--- Unavailable ---")
        print()

        return classifier

    def create_Unet(self):
        """Build and compile the U-net model for segmentation.

        Every setting is read from ``self.hyperparameters['segmentation']['unet']``.
        With ``depth`` = N the network has N downscaling blocks (two
        convolutions, optional batch normalization, max pooling) whose filter
        count doubles at each level starting from ``start_size``, followed by
        N-1 upscaling blocks. Each upscaling block upsamples, convolves,
        concatenates the result with the convolution output of the matching
        downscaling level, then applies two more convolutions and optional
        batch normalization. The output layer is a 1x1 convolution with
        ``last_layer_size`` filters and ``output_activation``.

        The configured loss "dice_coef_loss" is replaced by
        ``self.dice_coef_loss`` and the configured optimizer "adam" by
        ``Adam(lr=1e-5)``; other values are handed to keras as is. The metric
        is ``self.dice_coef``. The 'dropout' and 'noise_std' entries of the
        hyperparameters are not used by this architecture.

        Returns:
            The compiled keras ``Model``.
        """
        params = self.hyperparameters['segmentation']['unet']

        start_size = params['start_size']
        pool_size = (params['pool_size'], params['pool_size'])
        filter_size = (params['filter_size'], params['filter_size'])
        conv_activation = params['conv_activation']
        output_activation = params['output_activation']
        loss = params['loss']
        optimizer = params['optimizer']
        last_layer_size = params['last_layer_size']
        batch_normalization = params['batch_normalization']
        depth = params['depth']
        weight_regularization = params['weight_regularization']
        activation_regularization = params['activation_regularization']
        weight_limit = params['weight_limit']

        if loss == "dice_coef_loss":
            loss = self.dice_coef_loss

        if optimizer == "adam":
            optimizer = Adam(lr=1e-5)

        def create_conv_layer(size):
            """Return a new regularized, same-padded convolution layer with ``size`` filters."""
            return Conv2D(size,
                          filter_size,
                          activation=conv_activation,
                          padding='same',
                          kernel_initializer='he_uniform',  # initializes weights
                          kernel_regularizer=l2(weight_regularization),  # regularizes weights to avoid overfitting
                          activity_regularizer=l1(activation_regularization),  # regularizes activations to avoid overfitting
                          kernel_constraint=max_norm(weight_limit))  # caps the weight norm

        def create_downscale_layer(size, prev_layer):
            """Return (conv, pool): the block's convolution output and its max-pooled version."""
            conv = create_conv_layer(size)(prev_layer)
            conv = create_conv_layer(size)(conv)
            if batch_normalization:
                conv = BatchNormalization()(conv)

            pool = MaxPooling2D(pool_size=pool_size)(conv)

            return conv, pool

        def create_upscale_layer(size, prev_layer, level_layer):
            """Return (conv, up): the block's convolution output and the concatenated skip tensor."""
            upsampled = UpSampling2D(size=pool_size)(prev_layer)
            # This convolution uses pool_size as its kernel size and carries no regularizers
            up_conv = Conv2D(size, pool_size, activation=conv_activation, padding='same')(upsampled)
            up = concatenate([up_conv, level_layer], axis=3)

            conv = create_conv_layer(size)(up)
            conv = create_conv_layer(size)(conv)
            if batch_normalization:
                conv = BatchNormalization()(conv)

            return conv, up

        inputs = Input((self.image_width, self.image_height, 1))

        # List of (conv, pool) pairs. Index 0 is a placeholder pair so the first
        # downscaling block reads the raw input as the "pooled" tensor.
        downscale_layers = [(inputs, inputs)]

        # If N = depth, there will be N downscaling layers and N-1 upscaling layers
        for level in range(depth):
            layer_size = start_size * (2 ** level)
            conv, pool = create_downscale_layer(layer_size, downscale_layers[-1][1])
            downscale_layers.append((conv, pool))

        # The deepest downscaling block seeds the upscaling path; only its
        # convolution output is consumed, its pooled tensor is never used.
        upscale_layers = [downscale_layers[-1]]

        for level in range(depth - 1, 0, -1):
            layer_size = start_size * (2 ** (level - 1))
            # downscale_layers[level] is the block with the same filter count (index 0 is the placeholder)
            conv, up = create_upscale_layer(layer_size, upscale_layers[-1][0], downscale_layers[level][0])
            upscale_layers.append((conv, up))

        last_conv = upscale_layers[-1][0]

        conv_1d = Conv2D(last_layer_size, (1, 1), activation=output_activation)(last_conv)

        model = Model(inputs=inputs, outputs=conv_1d)

        model.compile(optimizer=optimizer, loss=loss, metrics=[self.dice_coef])

        print("Creating u-net")
        model.summary()

        return model

    def create_data_generator(self, feature_dataset, label_dataset, batch_size, step="train"):
        """Build a DataGenerator configured for "segment" labels.

        The step-specific options come from
        ``self.get_data_generator_params(step=step)``; augmentation is always
        switched off before they are passed to the generator.

        Args:
            feature_dataset: features handed to the generator unchanged.
            label_dataset: labels handed to the generator unchanged.
            batch_size: batch size handed to the generator unchanged.
            step: name of the step the options are looked up for
                (defaults to "train").

        Returns:
            The newly created DataGenerator.
        """
        params = self.get_data_generator_params(step=step)

        # can't easily augment, because that would change mask/label positions
        params['augment'] = False

        return DataGenerator(feature_dataset, label_dataset, batch_size, "segment", **params)

    def calculate_confusion_matrices(self, target_data, prediction_data):
        """Compute one pixel-level confusion matrix per image.

        Both inputs are converted to numpy arrays, so plain (nested) lists are
        accepted as well as arrays. The i-th target and the i-th prediction are
        flattened and compared.

        NOTE(review): ``confusion_matrix`` is called without ``labels``, so the
        shape of each matrix depends on the values present in that image (an
        image where targets and predictions hold a single value yields a 1x1
        matrix) - confirm that callers handle this.

        Args:
            target_data: expected masks, indexed by image along the first axis.
            prediction_data: predicted masks, indexed the same way.

        Returns:
            A list with one confusion matrix per entry of ``target_data``.
        """
        target_data = np.asarray(target_data)
        prediction_data = np.asarray(prediction_data)

        confusion_matrices = []
        for index in range(target_data.shape[0]):
            # flattens each image's mask into a 1D sequence of pixel labels
            targets = target_data[index].flatten()
            predictions = prediction_data[index].flatten()

            confusion_matrices.append(confusion_matrix(targets, predictions))

        return confusion_matrices

    def train_evaluate(self, model_arch="cnn", training_type="regular"):
        """Run the parent class's train_evaluate with the classification type fixed to "segmentation".

        Args:
            model_arch: architecture name forwarded to the parent (defaults to "cnn").
            training_type: training mode forwarded to the parent (defaults to "regular").
        """
        super().train_evaluate(classification_type="segmentation", model_arch=model_arch, training_type=training_type)

    def test(self, project, model_arch, date_to_retrieve, training_session_num, dataset_size):
        """Run the parent class's test with "segmentation" inserted after ``project``.

        All other arguments are forwarded positionally and unchanged.
        """
        super().test(project, "segmentation", model_arch, date_to_retrieve, training_session_num, dataset_size)

    def view_training_session_results(self, project, model_arch, date, session_num):
        """Run the parent class's view_training_session_results with "segmentation" inserted after ``project``.

        All other arguments are forwarded positionally and unchanged.
        """
        super().view_training_session_results(project, "segmentation", model_arch, date, session_num)


if __name__=="__main__":
    # Manual entry point: builds a binary classifier for the chest radiograph
    # project and starts a small CNN run on 10 samples.
    classifier = BinaryClassifier("chest_radiograph")
    # Alternative (note: SegmentationClassifier.__init__ requires the project name):
    # classifier = SegmentationClassifier("chest_radiograph")

    # CNN_classifier.train(dataset_size=200)

    # NOTE(review): `train` is not defined in the part of the file visible here
    # (the subclasses expose train_evaluate/test/view_training_session_results) -
    # confirm that the base class provides it.
    classifier.train(model_arch="cnn", dataset_size=10)
    # NOTE(review): the call below does not match the visible
    # test(project, model_arch, date_to_retrieve, training_session_num, dataset_size) signature.
    # classifier.test(model_arch="unet", dataset_size=10)