-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathdeepClass.py
487 lines (386 loc) · 17.8 KB
/
deepClass.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
402
403
404
405
406
407
408
409
410
411
412
413
414
415
416
417
418
419
420
421
422
423
424
425
426
427
428
429
430
431
432
433
434
435
436
437
438
439
440
441
442
443
444
445
446
447
448
449
450
451
452
453
454
455
456
457
458
459
460
461
462
463
464
465
466
467
468
469
470
471
472
473
474
475
476
477
478
479
480
481
482
483
484
485
486
487
import numpy as np
import os
import sys
import pickle
import time
import json
from functions import *
from conv import *
from visual import *
class DeepLearner():
#initialize class
def __init__(self, learning_type="classic", random_seed=123):
#basic settings for training
self.learning_type = learning_type
self.random_seed = random_seed
#default settings for training
self.layer_dims = [4,3,2]
self.layer_activation = ["relu","relu","relu"]
self.numberIterations = 10000
self.batch_size = 50
self.costType = "crossEntropy"
self.costParams = []
self.scoreMetrics = ["accuracy"]
self.learning_rate = 0.01
self.threshold = 0.5
self.numClasses = None
self.early_stopping = None
self.class_weight = None
self.epsilon = True
#default settings for cnn
self.filters = None
self.filterX = 3
self.filterY = 3
self.numFilters = 8
self.filterBias = 0
self.filterStride = 1
self.poolSize = 2
self.poolStride = 2
#params for history
self.params = None
self.costHistory = None
self.scoreHistory = None
#other settings
self.visual_mode = False
self.debug_mode = False
def initJit(self):
try:
from numba import cuda
gpu = cuda.gpus
target='cuda'
except:
target='cpu'
print(target)
#gives the possibility to change training parameters
def setTrainingParams(self, layer_dims=None, layer_activation=None, numberIterations=None,
learning_rate=None, batch_size=None,
threshold=None, early_stopping = None,
costType=None, costParams=None, scoreMetrics=None, epsilon=None):
if layer_dims is not None:
self.layer_dims = layer_dims
if layer_activation is not None:
self.layer_activation = layer_activation
if numberIterations is not None:
self.numberIterations = numberIterations
if learning_rate is not None:
self.learning_rate = learning_rate
if batch_size is not None:
self.batch_size = batch_size
if threshold is not None:
self.threshold = threshold
if early_stopping is not None:
self.early_stopping = early_stopping
if costType is not None:
self.costType = costType
if costParams is not None:
self.costParams = costParams
if scoreMetrics is not None:
self.scoreMetrics = scoreMetrics
if epsilon is not None:
self.epsilon = epsilon
#gives the possibility to change cnn parameters
def setCnnParams(self, filterX = None, filterY = None, numFilters = None,
filterBias = None, filterStride=None,
poolSize=None, poolStride=None):
if filterX is not None:
self.filterX = filterX
if filterY is not None:
self.filterY = filterY
if numFilters is not None:
self.numFilters = numFilters
if filterBias is not None:
self.filterBias = filterBias
if filterStride is not None:
self.filterStride = filterStride
if poolSize is not None:
self.poolSize = poolSize
if poolStride is not None:
self.poolStride = poolStride
#gives the possibility to change some settings
def setSettings(self, visual_mode=None, debug_mode=None):
if visual_mode is not None:
self.visual_mode = visual_mode
if debug_mode is not None:
self.debug_mode = debug_mode
#train the network
def _scoreString(self, values):
    """Format metric values as ", name: value, ..." for verbose prints;
    empty string when no score metrics are configured."""
    if not self.scoreMetrics:
        return ""
    return ", " + ", ".join(
        metric + ": " + str(round(values[j], 3))
        for j, metric in enumerate(self.scoreMetrics))

def optimize(self, X_input, Y_input, verbose=False, verbose_iter=100):
    """Train the network with mini-batch gradient descent.

    X_input -- training features; for a cnn, images of shape
               (samples, height, width) -- pixel values assumed 0..255
    Y_input -- target labels
    verbose -- when True, print cost/scores every `verbose_iter` epochs
    Fills self.params (and self.filters for a cnn) plus per-batch
    self.costHistory / self.scoreHistory.

    BUGFIXES vs. original:
    - cost/score histories were initialized and trimmed but never
      appended to;
    - `scores` was referenced while unbound when scoreMetrics is empty;
    - `rDura` raised NameError if early stopping fired in the first epoch;
    - the early-stopping `break` only left the batch loop, so training
      silently continued into the next epoch.
    """
    # check data and settings for consistency
    checkErrors(self.layer_activation, self.layer_dims, X_input, Y_input)
    # make runs reproducible
    np.random.seed(self.random_seed)
    # work on copies so the caller's arrays are never modified
    X = np.asarray(X_input).copy()
    Y = np.asarray(Y_input).copy()
    # count classes; a 2-class problem is handled as one binary output
    self.numClasses = len(np.unique(Y, return_counts=False))
    if self.numClasses == 2:
        self.numClasses = 1
    # replace NaN inputs with 0 (with a warning)
    if hasNaN(X):
        print("X has NaN-values. These are replaced with 0")
        X[np.isnan(X)] = 0
    # for a cnn: remember the image geometry, then normalize pixels
    if self.learning_type == "cnn":
        imgShape = [X.shape[1], X.shape[2]]
        X = (X / 255) - 0.5
    # reshape to the (features, samples) layout this NN works with
    X = reshape(X)
    Y = reshape(Y)
    # add input and output layers around the hidden-layer spec
    self.layer_dims = adapt_layer(self.layer_dims, self.layer_activation, X.shape[0], self.numClasses)
    # init weights and biases
    self.params = init_params(self.layer_dims)
    # optional live visualization of the network
    if self.visual_mode:
        visual = Visual()
        visual.drawNetwork(self.layer_dims, self.layer_activation,
                           self.params, Y)
        visual.show()
    # init convolution filters for a cnn
    if self.learning_type == "cnn":
        self.filters = init_filters(self.filterX, self.filterY, self.numFilters)
    # per-batch history, appended below
    self.costHistory = []
    self.scoreHistory = []
    # early-stopping bookkeeping
    maxCost = sys.maxsize  # sentinel so the first cost always improves
    maxScores = []
    stopCounter = 0
    bestParams = []
    bestFilters = []
    stopTraining = False
    # safe initial values (see BUGFIXES in the docstring)
    scores = []
    rDura = "0s"
    # the cnn front-end changes the input size; adapt the layer only once
    if self.learning_type == "cnn":
        inputLayerChanged = False
    # start training
    for epoch in range(self.numberIterations):
        batches = createBatches(X, self.batch_size)
        batches_Y = createBatches(Y, self.batch_size)
        # start time to measure how long an epoch takes
        rStart = time.time()
        for bt in range(len(batches)):
            batch = batches[bt]
            batch_y = batches_Y[bt]
            # cnn forward propagation (keeps the raw batch for backprop)
            if self.learning_type == "cnn":
                batch_orig = batch.copy()
                output = debug(self.debug_mode, cnn_forward_prop, [
                    batch_orig, self.filters, imgShape,
                    self.filterStride, self.filterBias,
                    self.poolStride, self.poolSize])
                batch, filteredCache = output[0], output[1]
                # filtering + pooling shrinks the input; adapt once
                if not inputLayerChanged:
                    self.layer_dims = changeInputLayer(self.layer_dims, X.shape[0])
                    # new layer_dims require freshly initialized params
                    self.params = init_params(self.layer_dims)
                    inputLayerChanged = True
            # dense forward propagation
            output = debug(self.debug_mode, forward_prop, [batch, self.params, self.layer_activation])
            AL, cache = output[0], output[1]
            # compute cost and save it to the history
            output = debug(self.debug_mode, compute_cost, [AL, batch_y, self.numClasses, self.costType, self.epsilon, self.costParams])
            cost = output[0]
            self.costHistory.append(cost)
            # compute scores and save them to the history
            if len(self.scoreMetrics) > 0:
                output = debug(self.debug_mode, compute_scores, [self.scoreMetrics, AL, batch_y, self.numClasses, self.threshold])
                scores = output[0]
            self.scoreHistory.append(scores)
            # track the best cost seen so far for early stopping
            if cost < maxCost:
                stopCounter = 0
                maxCost = cost
                maxScores = scores
                bestParams = self.params
                if self.learning_type == "cnn":
                    bestFilters = self.filters
            stopCounter += 1
            # dense backward propagation
            output = debug(self.debug_mode, backward_prop, [AL, batch_y, self.params, self.layer_activation, cache, self.numClasses, self.costType, self.costParams])
            grads = output[0]
            # cnn backward propagation
            if self.learning_type == "cnn":
                output = debug(self.debug_mode, cnn_backward_prop, [grads["dA0"], batch_orig, imgShape, filteredCache, self.filters])
                filterGrads = output[0]
            # parameter update
            output = debug(self.debug_mode, update_params, [self.params, self.layer_activation, grads, self.learning_rate])
            self.params = output[0]
            # filter update
            if self.learning_type == "cnn":
                output = debug(self.debug_mode, update_filters, [self.filters, filterGrads, self.learning_rate])
                self.filters = output[0]
            # early stopping: no improvement for `early_stopping` batches
            if self.early_stopping is not None and stopCounter == self.early_stopping:
                # restore the best parameters seen so far
                self.params = bestParams
                if self.learning_type == "cnn":
                    self.filters = bestFilters
                # drop the non-improving tail from the history
                self.costHistory = self.costHistory[:len(self.costHistory) - self.early_stopping]
                self.scoreHistory = self.scoreHistory[:len(self.scoreHistory) - self.early_stopping]
                stopTraining = True
                break
        # epoch duration for the verbose prints
        rEnd = time.time()
        rDura = str(round(rEnd - rStart, 4)) + "s"
        # todo rDura that time for all n things is summed (like for example 50)
        if stopTraining:
            if verbose:
                print("Early stopping after round " + str(epoch - self.early_stopping + 1)
                      + " cost: " + str(round(maxCost, 10))
                      + self._scoreString(maxScores) + " (" + rDura + ")")
            # leave the epoch loop as well -- no further improvement expected
            break
        # periodic progress report
        if verbose and epoch % verbose_iter == 0:
            print("Round " + str(epoch) + " cost: " + str(round(cost, 10))
                  + self._scoreString(scores) + " (" + rDura + ")")
#classify input and returns the probability
def predictProba(self, X_input):
    """Run a forward pass and return class probabilities, one row per
    input sample."""
    ## TODO: check if data is prepared or not and only do if not prepared
    features = reshape(np.asarray(X_input).copy())
    # forward pass with the trained parameters
    activations, _caches = forward_prop(features, self.params, self.layer_activation)
    # transpose so each row holds the probabilities for one sample
    return(activations.T)
#classify input with most likely class
def predict(self, X_input, threshold=0.5):
    """Classify input with the most likely class.

    X_input   -- samples to classify
    threshold -- decision threshold for the binary (single output) case
    Returns an array with one predicted class index per sample.

    BUGFIX: `threshold` was accepted but never used, and np.argmax over
    a single-column binary probability vector always returned class 0.
    """
    probas = self.predictProba(X_input)
    if probas.shape[1] == 1:
        # binary network: one probability column -> threshold it
        return (probas[:, 0] >= threshold).astype(int)
    # multiclass: pick the highest-probability class per sample
    return np.argmax(probas, axis=1)
#save model to file
def saveModel(self, filename, path=os.getcwd(), format="pickle"):
#save all parameters in a dict
modelDict = {}
#fill dict with learning type
modelDict["learning_type"] = self.learning_type
#fill dict with training settings
modelDict["layer_dimns"] = self.layer_dims
modelDict["layer_activation"] = self.layer_activation
modelDict["numberIterations"] = self.numberIterations
modelDict["learning_rate"] = self.learning_rate
modelDict["threshold"] = self.threshold
modelDict["costType"] = self.costType
modelDict["scoreMetrics"] = self.scoreMetrics
#fill dict with cnn settings
if self.learning_type == "cnn":
modelDict["filterX"] = self.filterX
modelDict["filterY"] = self.filterY
modelDict["numFilters"] = self.numFilters
modelDict["filterBias"] = self.filterBias
modelDict["filterStride"] = self.filterStride
modelDict["poolSize"] = self.poolSize
modelDict["poolStride"]= self.poolStride
#fill dict with training results
modelDict["params"] = self.params
if self.learning_type == "cnn":
modelDict["filters"] = self.filters
#fill dict with history
modelDict["costHistory"] = self.costHistory
modelDict["scoreHistory"] = self.scoreHistory
#save file as pickle file
if format == "pickle":
if (filename.endswith(".pkl")):
filename = filename[:-4]
f = open(path + "/" + filename + ".pkl", "wb")
pickle.dump(modelDict,f)
f.close()
#save file as txt
elif format == "txt":
if (filename.endswith(".txt")):
filename = filename[:-4]
#save file as json
elif format == "json":
if (filename.endswith(".json")):
filename = filename[:-5]
#change nd array to list
for key in modelDict["params"]:
modelDict["params"][key] = modelDict["params"][key].tolist()
with open(path + "/" + filename + ".json", 'w') as fp:
json.dump(modelDict, fp, indent=4)
#save file as csv
elif format == "csv":
if (filename.endswith(".csv")):
filename = filename[:-4]
else:
raise ValueError("this format is not supported")
#load model from dict and save values to class
def loadModel(self, path):
fileType = path[-3:]
if not os.path.exists(path):
raise ValueError("No file could be found at this location")
# TODO: do other types
if fileType == "pkl":
file = open(path, 'rb')
modelDict = pickle.load(file)
file.close()
elif fileType == "son":
file = open(path, 'rb')
jsonString = file.read()
modelDict = json.loads(jsonString)
file.close()
else:
raise ValueError("this format is not supported")
try:
#restore learning type
self.learning_type = modelDict["learning_type"]
#restore training settings
self.layer_dims = modelDict["layer_dimns"]
self.layer_activation = modelDict["layer_activation"]
self.numberIterations = modelDict["numberIterations"]
self.learning_rate = modelDict["learning_rate"]
self.threshold = modelDict["threshold"]
self.costType = modelDict["costType"]
self.scoreMetrics = modelDict["scoreMetrics"]
#restore cnn settings
if modelDict["learning_type"] == "cnn":
self.filterX = modelDict["filterX"]
self.filterY = modelDict["filterY"]
self.numFilters = modelDict["numFilters"]
self.filterBias = modelDict["filterBias"]
self.filterStride = modelDict["filterStride"]
self.poolSize = modelDict["poolSize"]
self.poolStride = modelDict["poolStride"]
#restore training results
self.params = modelDict["params"]
if modelDict["learning_type"] == "cnn":
self.filters = modelDict["filters"]
#restore history
self.costHistory = modelDict["costHistory"]
self.scoreHistory = modelDict["scoreHistory"]
except:
raise ValueError("The model file is corrupted.")
#plot training graph
def plotTraining(self, type):
    """Plot the recorded training history.

    type -- "cost" plots self.costHistory; "accuracy" plots the accuracy
            column of self.scoreHistory
    Raises ValueError for any other value (previously a silent no-op).

    BUGFIX: the accuracy branch read self.accuracyHistory, an attribute
    that is never set anywhere in this class (AttributeError); accuracy
    values live in self.scoreHistory at the position of "accuracy" in
    self.scoreMetrics.
    """
    if type == "cost":
        values = np.squeeze(self.costHistory)
    elif type == "accuracy":
        # NOTE(review): assumes each scoreHistory entry is a sequence
        # aligned with scoreMetrics -- confirm against compute_scores
        idx = self.scoreMetrics.index("accuracy")
        values = np.squeeze([entry[idx] for entry in self.scoreHistory])
    else:
        raise ValueError("type must be 'cost' or 'accuracy'")
    plt.plot(values)
    plt.ylabel(type)
    plt.xlabel('iterations (in 100)')
    plt.title('Learning rate =' + str(self.learning_rate))
    plt.show()