functions.r

# To do:
#
# - Color by batch, treatment, replicate, ....
# - Plotly lasso to select images
# - Summarize multiple measurements simultaneously


#
# Generic functions
#
loadpackage <- function(pckg){
    if(!(pckg %in% installed.packages())){
        install.packages(pckg)
    }
    library(pckg, character.only=TRUE)
}

# Print a string to the R console and to the webpage
echo <- function(...){
    temp <- do.call("paste0", list(...))
    print(temp)
    message(temp)
}


# Reads a data.frame from csv, tsv, and xlsx files. Does not read the older xls format.
# The file format can be explicitly mentioned or auto-detected.
read.HTMtable <- function(filepath, filetype = c("Auto", "csv", "tsv", "xlsx"), decimalseparator = c("Auto", ".", ",")){

    # filepath : full path to file. includes the filename. In Windows this is a temporary folder where the file is named '0'
    # filename : original filename

    loadpackage("openxlsx")

    if(filetype == "Auto" | missing(filetype)){
        
        tryCatch({
            temp       <- read.delim(filepath, header = T, as.is = T, stringsAsFactors = FALSE)
            temp       <- read.table(filepath, sep = "\t", nrows = 10, stringsAsFactors = FALSE)
            fileheader <- readLines(filepath, n = 1)
            
            if(grepl("\t", fileheader)){
                filetype <- "tsv"
            } else{
                filetype <- "csv"
            }
        },
            
        warning = function(e){
            filetype <<- "xlsx"
        })
    }

    if(filetype == "csv"){
        tryCatch(
            return( read.table(filepath, header = TRUE, sep = ",", dec = ".", fill = TRUE, as.is = TRUE, stringsAsFactors = FALSE) ),
            error = function(e) filetype == "invalid"
        )
    }
    
    if(filetype == "tsv"){
        tryCatch(
            {

                # Auto detect decimal separator
                if(decimalseparator == "Auto" | missing(decimalseparator)){

                    sampledata_df          <- read.table(filepath, header = TRUE, sep = "\t", nrows = 100, colClasses = "character", fill = TRUE, as.is = TRUE, stringsAsFactors = FALSE)
                    sampledata_char        <- as.character(as.matrix(sampledata_df))
                    
                    sampledata_with_dots   <- grep("\\.", sampledata_char, value = TRUE)
                    sampledata_with_1dot   <- sampledata_with_dots[!grepl("\\..*\\.", sampledata_with_dots)]
                    sampledata_with_commas <- grep(",", sampledata_char, value = TRUE)
                    sampledata_with_1comma <- sampledata_with_commas[!grepl(",.,", sampledata_with_commas)]
                    
                    # Let us imagine the true decimal separator is "."
                    sampledata_dotseparated <- sampledata_with_1dot[!is.na(as.numeric(sampledata_with_1dot))]
                    n_dotseparated          <- length(sampledata_dotseparated)
                    
                    # Let us imagine the true decimal separator is ","
                    sampledata_commaseparated <- gsub(",", "\\.", sampledata_with_1comma)
                    sampledata_commaseparated <- sampledata_commaseparated[!is.na(as.numeric(sampledata_commaseparated))]
                    n_commaseparated          <- length(sampledata_commaseparated)
                    
                    # Decide based on the most abundant
                    if(n_commaseparated > n_dotseparated){
                        decimalseparator <- ","
                    } else{
                        decimalseparator <- "."
                    }
                }

                return( read.table(filepath, header = TRUE, sep = "\t", dec = decimalseparator, fill = TRUE, as.is = TRUE, stringsAsFactors = FALSE) )
            },
            error = function(e) filetype == "invalid"
        )
    }
    
    if(filetype == "xlsx"){
        tryCatch(
            return( read.xlsx(filepath) ),
            error = function(e) filetype == "invalid"
        )
    }
    
    if(filetype == "invalid"){
        return( NULL )
    }
    
}


filterDataFrame <- function( df, x_col, y_col, batch_col, batch, highlightQCfailed, filterByColumn, whichValues, col_QC, subsampledata = FALSE, XAxisType = "continuous", subsampleN = 10, extremevalues = 10){

    # Subset batches
    if( ! is.null( batch_col ) & ! is.null( batch ) ) {
        if ( batch != "All batches" ) {
            df <- df[ df[[batch_col]] == batch, ]
        }
    }
    
    # Subset by columns
    if( !is.null( whichValues) & !is.null(filterByColumn) )
    {
        if( filterByColumn != "None" ) {
            if( !("All" %in% whichValues)  ) {
                OKrows <- sapply( df[[ filterByColumn ]], function(x)
                {
                    x %in% whichValues
                })
                df <- df[OKrows,]
            }
        }    
    }
    
    # Hide rejected data points if requested
    if( !is.null( highlightQCfailed) & !is.null(col_QC) )
    {
        if( highlightQCfailed == "Don't show" )
        {
            df <- df[df[[col_QC]],]
        }
    }
    
    # Subsample data frame
    if(subsampledata){
        
        # Decide how to do the subsampling
        switch(XAxisType, 
            "continuous" = {
                
                # The X axis is treated as a continuous numerical variable (i.e. there is only 1 category with continuous values)
                # This is the algorithm followed further below:
                #   1. Select the M highest and M lowest *of all y values* (These are the 'extreme values')
                #   2. Take all non-extreme values and show only 1 in each N (These are the 'subsampled values')
                #   3. Color the extreme values as green/red and subsampled values as black
                
                categories <- factor(rep(1, nrow(df)))
            },
            "categorical" = {
                
                # The X axis is treated as a categorical variable (each X value defines a category)
                # This is the algorithm followed further below:
                #   1. Split the data according according to their X values
                #   2. Select the M highest and M lowest values *of each X category* (These are the 'extreme values')
                #   3. Take all non-extreme values from each category and show only 1 in each N (These are the 'subsampled values')
                #   4. Color the extreme values as green/red and subsampled values as black
                
                categories <- factor(df[[x_col]])
            }
        )
             
        df_final <- by(df, categories, function(df_byCat){
            
            allvalues <- data.frame(x                = 1:nrow(df_byCat),
                                    values           = df_byCat[[y_col]],
                                    stringsAsFactors = FALSE)
            
            allvalues_numeric <- allvalues[!is.na(allvalues$values),]
            allvalues_numeric <- allvalues_numeric[order(allvalues_numeric$values, decreasing = TRUE),]
            
            # Row numbers of top and bottom M values
            rows_top    <- head(allvalues_numeric, n = extremevalues)[["x"]]
            rows_bottom <- tail(allvalues_numeric, n = extremevalues)[["x"]]
            
            # Row numbers of values which are not the top or bottom ones
            rows_others <- setdiff(allvalues$x, c(rows_top, rows_bottom))
            
            # Row numbers of each Nth row
            rows_sampled <- rows_others[seq(from = 1, to = length(rows_others), by = subsampleN)]
            
            # Assemble final data frame (extreme_low, extreme_high and subsampled values only)
            df_final0 <- df_byCat[c(rows_top, rows_bottom, rows_sampled),]
            df_final0$HTM_color <- c(rep("green3", extremevalues),
                                     rep("red", extremevalues),
                                     rep("black", length(rows_sampled)))
            df_final0
        })
        
        df_final <- do.call(rbind, df_final)

    } else{
        df_final <- df
    }

    return(df_final)
    
}


################################################################
# PLOTTING                                                     #
################################################################

    # Plotting UI
    ############################################################


    # Plot-generating functions
    ############################################################
    

# Generate Plotly scatter/jitter plot
pointPlot <- function( df, x, y, plottype, col_QC, highlightQCfailed, beeswarm = FALSE, splitBy = "None", colTreatment, colBatch, colColors ){

    # Initialize variables
    df$lineIndex <- 1:nrow(df)
    plotSymbols <- c( approved = 20, rejected = 4 )
    
    # Assign symbol to be used at each data point
    symbols <- if( highlightQCfailed == "Show with cross" ){
        sapply( df[[col_QC]], function(x) ifelse( x, plotSymbols["approved"], plotSymbols["rejected"] ) )
    } else{
        plotSymbols["approved"]
    }
    
    # Initialize colors
    if(is.null(colColors)){
        plotColors <- rep("black", nrow(df))
    } else{
        plotColors <- df[[colColors]]
    }
    names(plotColors) <- plotColors
    
    # # Decide what kind of plot to do: scatter, jitter or beeswarm;
    # plottype <- if(is.numeric( df[[x]] ) & is.numeric( df[[y]] )){
    #     "scatter"
    # } else{
    #     if(beeswarm){
    #         "beeswarm"
    #     } else{
    #         "jitter"
    #     }
    # }


    g <- ggplot(df, aes_string( paste0( "`", x,"`" ), paste0( "`", y,"`" ))) + ggtitle( colBatch ) + scale_colour_gradient2()
    
    
    # Generate plot object
    # SCATTER PLOT
    if(plottype == "scatter"){
        
        g <- g + geom_point(shape = symbols,
                aes(text = sprintf(
                "<br>Treatment: %s<br>Batch: %s<br>Line Index: %s", df[[colTreatment]], df[[colBatch]], df$lineIndex), color = plotColors)) +
                 scale_color_manual(values=plotColors) + 
                 theme(legend.position="none")
        
    }
    
    # BEESWARM
    if(plottype == "beeswarm"){
        
        g <- g + geom_quasirandom(shape = symbols, aes(text = sprintf("<br>Treatment: %s<br>Batch: %s<br>Line Index: %s", df[[colTreatment]], df[[colBatch]], df$lineIndex), color = plotColors)) + 
                 scale_color_manual(values=plotColors) + 
                 theme(legend.position="none")
    }
    
    # JITTER
    if(plottype == "jitter"){
        
        jitteramount = 0.2
        
        # Jitter non-numerical axis
        if(class(df[[x]]) %in% c("integer", "numeric")){
            jitterX <- 0
        } else{
            jitterX <- jitteramount  
        }
        if(class(df[[y]]) %in% c("integer", "numeric")){
            jitterY <- 0
        } else{
            jitterY <- jitteramount  
        }
        
        g <- g + geom_jitter(shape = symbols, aes(text = sprintf("<br>Treatment: %s<br>Batch: %s<br>Line Index: %s", df[[colTreatment]], df[[colBatch]], df$lineIndex), color = plotColors ), position = position_jitter(w = jitterX, h = jitterY)) +
                 scale_color_manual(values=plotColors) + 
                 theme(legend.position="none")
        
    }
    
    
    # Customize plot
    if(splitBy != "None"){
        g <- g + 
            facet_grid( as.formula(paste("~", splitBy)), scales = "free_x" ) + 
            theme( strip.text.x = element_text( angle = 90 ) )
    }
    
    # Output finished plot
    ggplotly( g )
}

# Generate Plotly boxplot
boxPlot <- function(df, batch, x, y, col_QC, highlightCenter = "No", splitBy = "None", colTreatment, colBatch  ){


    # Make plot
    g <- ggplot( df, aes_string( paste0( "`", x,"`" ), paste0( "`", y,"`" ) ) )
    g <- g + geom_boxplot() + ggtitle( batch )
    
    # Customize plot
    if(highlightCenter != "No"){
        g <- switch(highlightCenter,
                    "Mean"   = g + stat_summary(fun.y = "mean",   colour = "red", size = 4, geom = "point", alpha = 0.5),
                    "Median" = g + stat_summary(fun.y = "median", colour = "red", size = 4, geom = "point", alpha = 0.5)
        )
    }
    if(splitBy != "None"){
        g <- g + 
            facet_grid(as.formula(paste("~", splitBy)), scales = "free_x") + 
            theme(strip.text.x = element_text(angle = 90))
    }
    
    # Output finished plot
    ggplotly(g)
}

# Generate Plotly heatmap
heatmapPlot <- function( df, measurement, batch, nrows, ncolumns, symbolsize=1, col_QC, highlightQCfailed, colorMin = -Inf, colorMax = +Inf, lutColors = "Blue-White-Red", colTreatment, colBatch ){
    
    # Initialize variables
    df$lineIndex <- 1:nrow(df)
    plotSymbols <- c(approved = 15, rejected = 4)

    print( paste("Selected lutColors:", lutColors) )

    if ( is.null( lutColors ))
    {
        colorGrad   <- c("blue", "white", "red")
    }
    else
    {
        if ( lutColors == "Blue-White-Red" )
        {
            colorGrad   <- c("blue", "white", "red")
        }
        else if ( lutColors == "Red-White-Green" )
        {
            colorGrad   <- c("red2", "white", "green4")
        }
        else
        {
            colorGrad   <- c("blue", "white", "red")
        }
    }

    print( paste0( "colorMin ", colorMin ) )
    print( paste0( "colorMax ", colorMax ) )

    # Column 'LUT' has numeric values which are solely used for the color lookup table
    df$LUT <- sapply(df[[measurement]], function(f){
        if(is.na(f)) return(f)
        if(f <= colorMin) return(colorMin)
        if(f >= colorMax) return(colorMax)
        f
    })
    
    # Define the data to be plotted
    g <- ggplot( df, 
                 aes( heatX, heatY, color = LUT, 
                      text = sprintf("%s: %s<br>Treatment: %s<br>Batch: %s<br>Line Index: %s", measurement, df[[measurement]], df[[colTreatment]], df[[colBatch]], df$lineIndex)
                 ) 
    )
    
    # Calculate the symbol to be used at each data point
    symbols <- if( highlightQCfailed == "Show with cross")
    {
        sapply( df[[col_QC]], function(x) ifelse(x, plotSymbols["approved"], plotSymbols["rejected"]))
    } 
    else
    {
        plotSymbols["approved"]
    }
    
    
    # Other plot settings
    g <- g + geom_point(size=symbolsize, shape=symbols) + 
        scale_colour_gradientn(colors = colorGrad) + 
        ggtitle(batch) + 
        theme(panel.grid = element_blank()) +
        scale_x_continuous(breaks = 1:ncolumns) +
        scale_y_continuous(breaks = 1:nrows, labels = LETTERS[nrows:1]) + 
        theme(axis.title.x=element_blank(), axis.title.y=element_blank())
    
    
    # Output finished plot
    ggplotly( g )
    
}

# Can open multiple files at once
# filePath is an array of character strings
OpenInFiji <- function( directories, filenames, fijiBinaryPath = "C:\\Fiji.app\\ImageJ-win64.exe", x, y, z, stackName = "composite" )
{
    num_images = length( directories );  
    
    import_image_sequence_reg_exp_template = "IJ.run(\"Image Sequence...\", \"open=[DIRECTORY] file=(REGEXP) sort\");";
    open_image_template = "IJ.open(\"DIRECTORY/FILENAME\");";
    
    # init
    commands <- "import ij.IJ;\n"
    commands <- paste0( commands, "import ij.ImagePlus;", "\n" );
    commands <- paste0( commands, "import ij.gui.OvalRoi;", "\n" );
    
    # Generate the expression opening each image
    for ( i in seq(1, num_images) )
    {
        if( grepl("\\?", filenames[ i ] ) )
        {
            # directory
            import_image_sequence_reg_exp <- sub( "DIRECTORY", directories[ i ], import_image_sequence_reg_exp_template, fixed = TRUE )
            
            # filename / regexp
            reg_exp = gsub( "\\", "\\\\", filenames[ i ], fixed = TRUE )
            import_image_sequence_reg_exp <- sub( "REGEXP", reg_exp, import_image_sequence_reg_exp, fixed = TRUE )
            
            commands <- paste0( commands, import_image_sequence_reg_exp, "\n" );
        }
        else
        {
            open_image = sub( "DIRECTORY", directories[ i ], open_image_template, fixed = TRUE )
            open_image = sub( "FILENAME", filenames[ i ], open_image, fixed = TRUE )
            commands <- paste0( commands, open_image, "\n" )
        }
        
        if ( grepl( "LabelMask", filenames[ i ], ignore.case = TRUE ) )
        {
            set_label_mask_lut = "IJ.run(\"glasbey inverted\", \"\");";
            commands <- paste0( commands, set_label_mask_lut, "\n" )
            # IJ.run("16-bit", "");
        }
        
        get_imp = paste0( "ImagePlus imp", i, " = IJ.getImage(); ");
        commands <- paste0( commands, get_imp, "\n" )
        
    }
    
    # When opening more than 1 image: additional post-processing required
    
    if ( num_images > 1 & num_images <= 7 )
    {
        # Create composite image. ImageJ supports up to 7 channels.
        # merge_channels = "IJ.run(imp1, \"Merge Channels...\", \"c1=\"+imp1.getTitle()+\" c2=\"+imp2.getTitle()+\" create\");"
        merge_channels = paste0("IJ.run(imp1, \"Merge Channels...\", ",
                                paste0(
                                    sapply(1:num_images, function(x) paste0("\"c", x, "=\"+imp", x, ".getTitle()")), collapse = "+\" \"+"
                                ),
                                "+\" create\");")
        get_imp2     <- paste0( "ImagePlus imp = IJ.getImage(); ")
        rename_stack <- paste0("imp.setTitle(\"", stackName, "\");")
        
        commands <- paste0( commands, merge_channels, "\n" )
        commands <- paste0( commands, get_imp2, "\n" )
        commands <- paste0( commands, rename_stack, "\n" )
        commands <- paste0( commands, "IJ.wait( 100 );", "\n" ) # needs time to build the composite image
    }
    if ( num_images > 7 )
    {
        # Create stack
        make_stack = "IJ.run(imp1, \"Images to Stack\", \"name=Stack title=[] use\");"
        commands <- paste0( commands, make_stack, "\n" )
    }
    
    #
    # highlight object 
    #

    # set slice
    if ( ! is.null( z ) &&  z != "NA" )
    { 
        setSlice = paste0( "IJ.getImage().setPosition( 1 ,", ceiling( z ) ,", 1);" )
        commands <- paste0( commands, setSlice, "\n" );
    }
    
    # put ROI at object location
    if (! is.null( x ) && ! is.null( y ) && ( x != "NA" ) && ( y != "NA" ) )
    { 
        diameter = 50;
        x <- x - 25;
        y <- y - 25;
        setRoi = paste0( "IJ.getImage().setRoi( new OvalRoi(", x, "," , y, ",",diameter,",",diameter,") )");
        commands <- paste0( commands, setRoi, "\n" );
        addAsOverlay = paste0( "IJ.run (IJ.getImage(), \"Add Selection...\", \"\")" );
        commands <- paste0( commands, addAsOverlay, "\n" );
    }
    
    #
    # write commands to groovy script    
    #
    
    tmp_directory = paste0( getwd(), "/tmp" ) 
    dir.create( tmp_directory, showWarnings = FALSE )
    tmp_groovy_script = paste0( tmp_directory, "/openImages.groovy" );
    write( commands, file = tmp_groovy_script) ;
    
    system_cmd = paste( fijiBinaryPath, '--run', paste0( '\"', tmp_groovy_script, '\"') );
    
    # print groovy commands for user info and debugging
    print( commands )
    
    # print command for user info and debugging
    print( system_cmd )
    
    # Evoke Fiji with the expression compiled above
    system( system_cmd, wait = FALSE )
}

# Generate coordinates for heatmap
generateHeatmapCoordinates <- function(WellX, WellY, PosX, PosY, subposjitter = 0.2){
    
    numWells <- WellX * WellY
    numSubpos <- PosX * PosY
    
    # Map well numbers to a plate layout
    wellLayout <- matrix(1:numWells, WellY, WellX, byrow = TRUE, dimnames = list(LETTERS[1:WellY], 1:WellX))
    
    # (x,y) coordinates for all well centers
    WellCenters <- data.frame(wellnum = integer(), X = integer(), Y = integer())
    for (i in 1:WellY){
        for (j in 1:WellX){
            temp <- which(wellLayout == wellLayout[i,j], arr.ind=TRUE)
            WellCenters <- rbind(WellCenters, 
                                 data.frame(wellnum = wellLayout[i,j], X = temp[1,"col"], Y = -temp[1,"row"]+WellY+1)
            )
        }
    }
    
    # Map subposition array
    posLayout <- matrix(1:numSubpos, PosY, PosX, byrow = TRUE, dimnames = list(LETTERS[1:PosY], 1:PosX))
    
    # (x,y) coordinates for each subposition cluster.
    PosCenters <- data.frame(posnum = integer(), X = numeric(), Y = numeric())
    for (u in 1:PosY){
        for (v in 1:PosX){
            temp <- which(posLayout == posLayout[u,v], arr.ind=TRUE)
            PosCenters <- rbind(PosCenters, 
                                data.frame(posnum = posLayout[u,v], X = temp[1,"col"]-0.5-PosX/2, Y = -temp[1,"row"]+PosY/2+0.5)
            )
        }
    }
    PosCenters[, c("X", "Y")] <- PosCenters[, c("X", "Y")] * subposjitter
    
    
    # (x,y) coordinates for all images in a plate
    temp <- data.frame(wellnum = integer(), posnum = integer(), X = numeric(), Y = numeric())
    for(w in 1:numWells){
        
        localcenter <- do.call("rbind", replicate(numSubpos, WellCenters[w,], simplify = FALSE))
        localcenter$posnum <- PosCenters$posnum
        localcenter$X <- localcenter$X + PosCenters$X
        localcenter$Y <- localcenter$Y + PosCenters$Y
        
        temp <- rbind(temp, localcenter)
    }
    
    temp <- temp[, c("wellnum", "posnum", "X", "Y")]
    row.names(temp) <- NULL
    temp
}

# Creates a 1-batch data.frame with all additional data required for a
makeHeatmapDataFrame <- function(df, WellX, WellY, PosX, PosY, subposjitter = 0.2, batch_col, batch, col_Well, col_Pos, col_QC = "HTM_QC"){
    
    if(batch == "All batches") return(NULL)
    
    # Subset data frame
    df <- df[df[[batch_col]] == batch,]
    
    # Calculate coordinates for heatmap
    dfCoords <- generateHeatmapCoordinates(WellX, WellY, PosX, PosY, subposjitter)
    
    # Add heatmap coordinates
    for(i in 1:nrow(df)){
        w  <- df[i,col_Well]
        p  <- df[i,col_Pos]
        xy <- dfCoords[dfCoords$wellnum == w & dfCoords$posnum == p, c("X", "Y")]
        
        df[i, "heatX"] <- xy[1,"X"]
        df[i, "heatY"] <- xy[1,"Y"]
    }
    
    df
}


# Apply QC
applyQC <- function(df, dfQC){
    
    # This an example of how the 'dfQC' data.frame needs to look like
    # 'measurement' is the name of one of the columns in 'df'
    # All values in 'df' are text
    # dfQC <- data.frame(type = c("Numeric QC", "Numeric QC", "Text QC", "Failed experiment"), measurement = c("Count_cell_all", "Count_cell_final", "FileName_PM", "Metadata_platePath"), minimum = c("50", "20", "image1.tif", "myplate_01"), maximum = c("500", "100", "image1.tif", "myplate_01"), stringsAsFactors = FALSE)
    
    # Make sure the data frame only contains character variables (no factors wanted!)
    dfQC[] <- lapply(dfQC, as.character)
    
    apply(df, 1, function(x){
        
        QCoverall <- NULL
        for(i in 1:nrow(dfQC)){
            
            testvalue <- x[dfQC[i, "measurement"]]
            if(is.na(testvalue)){                   # Make sure "NA" is correctly interpreted
                testvalue <- "NA"}
            if(is.nan(testvalue)){                  # Make sure "NaN" is correctly interpreted
                testvalue <- "NaN"}
            
            temp <- switch (as.character(dfQC[i,"type"]),
                            "Numeric QC"        = if(is.na(testvalue)){
                                FALSE
                            } else{
                                as.numeric(testvalue) >= as.numeric(dfQC[i, "minimum"]) & as.numeric(testvalue) <= as.numeric(dfQC[i, "maximum"])
                            },
                            "Text QC"           = testvalue != dfQC[i, "minimum"],
                            "Failed experiment" = testvalue != dfQC[i, "minimum"]
            )
            
            QCoverall <- c(QCoverall, temp)
        }
        
        all(QCoverall)
    })
    
}


#####################################################
################ From HTM-Explorer (below) ##########
#####################################################

#
# Normalization
#

htmNormalization <- function(
    data, measurements, col_Experiment, transformation, gradient_correction, normalisation,
negcontrol, col_QC, col_Well, col_Treatment, num_WellX = 0, num_WellY = 0) {
    
    echo("*")
    echo("* Data normalization")
    echo("*")
    echo("")
    
    
    # remove previously computed columns
    drops = names(data)[which(grepl("HTM_norm", names(data)))]
    data <- data[ ,!(names(data) %in% drops)]
    
    
    # get all necessary information
    measurements        <- sort(measurements)
    experiments         <- sort(unique(data[[col_Experiment]]))
    gradient_correction <- gsub("-", "_", gradient_correction)        # The dash character '-' is mishandled by the selectInput widgets of shiny
    normalisation       <- gsub("-", "_", normalisation)              # The dash character '-' is mishandled by the selectInput widgets of shiny
    #    transformation      <- transformation
    #    negcontrol          <- negcontrol
    
    
    # compute
    for (measurement in measurements) {
        
        echo("Measurement:")
        echo("     ", measurement)
        echo("Negative Control:")
        echo("     ", negcontrol)
        
        #
        # Check           
        #
        if( ! (measurement %in% names(data)) ) {
            cat(names(data))
            cat("\nError: selected measurement does exist in data columns!\n")
            return(data)
        }
        
        #
        # Analyze
        #
        
        manipulation <- "__"
        input <- measurement
        
        # Log2
        if(transformation == "log2") {
            
            echo("")
            echo("Log2:")
            echo("  Input: ", input)
            
            # compute log transformation
            # create new column name
            manipulation <- paste0(manipulation,"log2__")
            
            output = paste0("HTM_norm",manipulation,measurement)
            
            idsGtZero <- which(data[[input]]>0)
            idsSmEqZero <- which(data[[input]]<=0)
            data[idsGtZero,output] <- log2(data[idsGtZero,input]) 
            data[idsSmEqZero,output] <- NaN
            echo("  Output: ", output)
            echo("  Number of data points: ", length(data[[input]]))
            echo("  NaN's due to <=0: ", length(idsSmEqZero))
            
            # todo: this should be at a more prominent position
            #print("Replacing -Inf in log scores ******************************")
            #logScores = data[[output]]
            #finiteLogScores = subset(logScores,is.finite(logScores))
            #minimum = min(finiteLogScores)
            #idsInf = which(is.infinite(logScores))
            #logScores[idsInf] <- minimum
            #data[[output]] <- logScores
            
            #htmAddLog("Replacing Infinities in Log2 Score by")
            #htmAddLog(minimum)
            #htmAddLog("Affected Wells:")
            #for(id in idsInf) {
            #  htmAddLog(htm@wellSummary$treatment[id])
            #  htmAddLog(htm@wellSummary$wellQC[id])
            #  htmAddLog(htm@wellSummary[id,logScoreName])
            #  htmAddLog("")
            #}
            
            input <- output
            
        } # if log transformation
        
        
        if(gradient_correction == "median polish") {
            
            echo("  median polish of ", input)
            
            # also store the background
            gradient = paste0("HTM_norm",paste0(manipulation,"__medpolish_gradient__"),measurement)
            
            manipulation <- paste0(manipulation,"__medpolish_residuals__")
            output = paste0("HTM_norm",manipulation,measurement)
            
            data[[output]] = rep(NA,nrow(data))
            
            for(experiment in experiments) {
                
                echo("")
                echo("  Experiment: ",experiment)
                
                indices_all <- which((data[[col_Experiment]] == experiment))
                #indices_ok <- which((data[[col_Experiment]] == experiment) & (data[[col_QC]]) & !is.na(data[[input]]))
                
                # extract values
                xy = htm_convert_wellNum_to_xy(data[indices_all, col_Well], num_WellX, num_WellY) 
                mp = htmMedpolish(xx=xy$x, yy=xy$y, val=data[indices_all, input], num_WellX, num_WellY)
                
                data[indices_all, output] = mp$residuals
                data[indices_all, gradient] = mp$gradient
                
            } # experiment loop
            
            input <- output
            
        } #medpolish
        
        
        if( gradient_correction %in% c("median 7x7","median 5x5","median 3x3")) {
            
            echo("  median filter of ", input)
            
            gradient = paste0("HTM_norm",paste0(manipulation,"__",gradient_correction,"__gradient__"),measurement)
            manipulation <- paste0(manipulation,"__",gradient_correction,"__residuals__")
            output = paste0("HTM_norm",manipulation,measurement)
            
            data[[output]] = rep(NA,nrow(data))
            
            for(experiment in experiments) {
                
                echo("  Experiment: ", experiment)
                
                indices_all <- which((data[[col_Experiment]] == experiment))
                indices_ok  <- which((data[[col_Experiment]] == experiment) & (data[[col_QC]]) & !is.na(data[[input]]))
                
                xy = htm_convert_wellNum_to_xy(data[indices_ok, col_Well], num_WellX, num_WellY) 
                
                if(gradient_correction == "median 7x7") {
                    mp = htmLocalMedian(xx=xy$x, yy=xy$y, val=data[indices_ok, input], size=7, num_WellX, num_WellY)
                }
                if(gradient_correction == "median 5x5") {
                    mp = htmLocalMedian(xx=xy$x, yy=xy$y, val=data[indices_ok, input], size=5, num_WellX, num_WellY)
                }
                if(gradient_correction == "median 3x3") {
                    mp = htmLocalMedian(xx=xy$x, yy=xy$y, val=data[indices_ok, input], size=3, num_WellX, num_WellY)
                }
                
                data[indices_ok, output] = mp$residuals
                data[indices_ok, gradient] = mp$gradient
                
            } # experiment loop
            
            input <- output
            
        } #median filter
        
        
        if( gradient_correction %in% c("z_score 5x5")) {
            # Mean = E(X)
            # Variance = E(X^2)-E(X)^2
            # Z-Score = (Xi - E(X)) / Sqrt(E(X^2)-E(X)^2)
            
            echo("  5x5 z-score filter of ", input)
            
            # also store the background
            standard_deviation = paste0("HTM_norm",paste0(manipulation,"__5x5_standard_deviation__"),measurement)
            mean_value = paste0("HTM_norm",paste0(manipulation,"__5x5_mean__"),measurement)
            manipulation <- paste0(manipulation,"__5x5_z_score__")
            output = paste0("HTM_norm",manipulation,measurement)
            
            data[[output]] = rep(NA,nrow(data))
            data[[standard_deviation]] = rep(NA,nrow(data))
            data[[mean_value]] = rep(NA,nrow(data))
            
            for(experiment in experiments) {
                
                echo("  Experiment: ", experiment)
                
                indices_all <- which((data[[col_Experiment]] == experiment))
                xy = htm_convert_wellNum_to_xy(data[indices_all, col_Well], num_WellX, num_WellY) 
                
                mp = htmLocalZScore(xx=xy$x, yy=xy$y, val=data[indices_all, input], size=5, num_WellX, num_WellY)
                
                data[indices_all, mean_value] = mp$avg
                data[indices_all, standard_deviation] = mp$sd
                data[indices_all, output] = mp$z
                
                
            } # experiment loop
            
            input <- output
            
        } #median filter
        
        
        if(normalisation != "None selected") {
            
            echo("")
            echo("Per batch normalisation:")
            echo("  Method: ", normalisation)
            echo("  Input: ", input)
            
            # init columns
            manipulation <- paste0(manipulation,normalisation,"__")
            output = paste0("HTM_norm",manipulation,measurement)
            output <- gsub(" ", "_", output)
            data[[output]] = NA
            echo("  Output: ",output)
            
            # computation
            #cat("\nComputing normalisations...\n")
            
            for(experiment in experiments) {
                
                #print("")
                #print(paste("  Experiment:",experiment))
                
                indices_all <- which((data[[col_Experiment]] == experiment))
                indices_ok  <- which((data[[col_Experiment]] == experiment) & (data[[col_QC]]) & !is.na(data[[input]]))
                
                if("All treatments" %in% negcontrol) {
                    indices_controls_ok <- indices_ok
                } else {
                    indices_controls_ok <- which((data[[col_Experiment]] == experiment) 
                                                 & !is.na(data[[input]]) 
                                                 & (data[[col_QC]]) 
                                                 & (data[[col_Treatment]] %in% negcontrol))
                }
                
                #print(paste("   Total", length(indices_all)))
                #print(paste("   Valid", length(indices_ok)))      
                #print(paste("   Valid Control", length(indices_controls_ok)))
                
                # extract control values 
                valuescontrol <- data[indices_controls_ok, input]
                #print(valuescontrol)
                
                nr_of_controls <- length(valuescontrol)
                meancontrol    <- mean(valuescontrol)    
                sigmacontrol   <- sd(valuescontrol) 
                mediancontrol  <- median(valuescontrol)
                madcontrol     <- mad(valuescontrol)  
                semcontrol     <- sigmacontrol/sqrt(nr_of_controls)     
                #print(paste("    Control Mean:", meancontrol))
                #print(paste("    Control SD:", sigmacontrol))
                #print(paste("    Control Median:", mediancontrol))
                #print(paste("    Control MAD:", madcontrol))
                
                if(normalisation == "z_score") {
                    data[indices_all, output] <- ( data[indices_all, input] - meancontrol ) / sigmacontrol
                } 
                else if(normalisation == "z_score (median subtraction)") {
                    data[indices_all, output] <- ( data[indices_all, input] - mediancontrol ) / sigmacontrol
                }
                else if(normalisation == "robust z_score") {
                    data[indices_all, output] <- ( data[indices_all, input] - mediancontrol ) / madcontrol
                }
                else if(normalisation == "subtract mean ctrl") {
                    data[indices_all, output] <- data[indices_all, input] - meancontrol 
                }
                else if(normalisation == "divide by mean ctrl") {
                    data[indices_all, output] <- data[indices_all, input] / meancontrol 
                }
                else if(normalisation == "subtract median ctrl") {
                    data[indices_all, output] <- data[indices_all, input] - mediancontrol 
                }
                else if(normalisation == "divide by median ctrl") {
                    data[indices_all, output] <- data[indices_all, input] / mediancontrol 
                }
                
            } # experiment loop
            
            input <- output
            
        } # if normalisation
        
    } # measurement loop
    
    return(data)
    
}


#
# Spatial position related
#

htm_convert_wellNum_to_xy <- function(wellNum, plate.ncol, plate.nrow) {
    
    ### GET PLATE INFO
    plate.nwells = plate.nrow * plate.ncol
    
    ### intialise
    xx = vector(length=length(wellNum))
    yy = xx
    
    ### WELLS  
    plate.wellNumToRow = vector(length=plate.nwells);
    plate.wellNumToCol = vector(length=plate.nwells);
    iw = 1;
    for(ir in 1:plate.nrow) {
        for(ic in 1:plate.ncol) {
            plate.wellNumToRow[iw] = ir;
            plate.wellNumToCol[iw] = ic;
            iw=iw+1;
        }  
    }
    
    
    ## return
    
    list(y = plate.wellNumToRow[wellNum],
         x = plate.wellNumToCol[wellNum])
    
    
}


#
# Local data normalisation
#

htmMedpolish <- function(xx, yy, val, num_PosX, num_PosY) {
    
    
    # averaging for multi-sub-positions?
    m = matrix(nrow=num_PosX,ncol=num_PosY)        # from Hugo to Tischi: aren't the xy coordinates flipped?
    mi = m 
    for(i in seq(1:length(val))) {
        #print(paste(xx[i],yy[i],val[i]))
        m[xx[i],yy[i]] <- val[i]
        mi[xx[i],yy[i]] <- i # remember where the data belongs in the original format
    }
    #print("raw"); dev.new(); image(m, col=gray((0:32)/32))
    
    med = medpolish(m, maxiter = 100, na.rm = T)
    m_gradient <-  med$overall + outer(med$row,med$col, "+")
    m_residuals <- m - m_gradient
    
    #print("gradient"); dev.new(); image(m_gradient, col=gray((0:32)/32))
    #print("residuals"); dev.new(); image(m_residuals, col=gray((0:32)/32))
    
    # covert back
    val_gradient = vector(length=length(val))
    val_residual = vector(length=length(val))
    for(i in seq(1:length(val))) {
        val_gradient[mi[xx[i],yy[i]]] = m_gradient[xx[i],yy[i]]
        val_residual[mi[xx[i],yy[i]]] = m[xx[i],yy[i]] - m_gradient[xx[i],yy[i]] 
    }
    
    list(gradient = val_gradient,
         residuals = val_residual)
}

htmLocalMedian <- function(xx, yy, val, size, num_PosX, num_PosY) {
    
    echo("  median filter with size ", size)
    
    
    x <- htmXYVtoMatrix(xx, yy, val, num_PosX, num_PosY) # averaging for multi-sub-positions?
    m <- x$m
    
    m_gradient  <- as.matrix(focal(raster(m), matrix(1, size, size), function(z) median(z, na.rm=T), pad = T, padValue = NA))
    m_residuals <- m - m_gradient
    
    list(gradient  = htmMatrixToXYV(xx, yy, m_gradient, x$mi),
         residuals = htmMatrixToXYV(xx, yy, m_residuals, x$mi))
}

htmLocalZScore <- function(xx, yy, val, size, num_PosX, num_PosY) {
    
    echo("  local z_score filter with size ", size)
    
    
    x <- htmXYVtoMatrix(xx, yy, val, num_PosX, num_PosY) # averaging for multi-sub-positions?
    m <- x$m
    
    m_mean <- as.matrix(focal(raster(m), matrix(1, size, size), function(z) mean(z, na.rm=T), pad = T, padValue = NA))
    m_meansqr <- as.matrix(focal(raster(m^2), matrix(1, size, size), function(z) mean(z, na.rm=T), pad = T, padValue = NA))
    m_sd = sqrt( m_meansqr - m_mean^2 )
    m_z = (m - m_mean) / m_sd
    
    #print("before")
    #print(m[1:10,1:6])
    #print("avg")
    #print(m_mean[1:10,1:6])
    #print("sd")
    #print(m_sd[1:10,1:6])
    #print("z")
    #print(m_z[1:10,1:6])
    #ddd
    
    list(avg = htmMatrixToXYV(xx, yy, m_mean, x$mi),
         sd  = htmMatrixToXYV(xx, yy, m_sd, x$mi),
         z   = htmMatrixToXYV(xx, yy, m_z, x$mi))
}

htmXYVtoMatrix <- function(xx, yy, val, num_PosX, num_PosY) {
    m = matrix(nrow=num_PosY, ncol=num_PosX)
    mi = m 
    for(i in seq(1:length(val))) {
        m[yy[i],xx[i]] <- val[i]
        mi[yy[i],xx[i]] <- i # remember where the data belongs in the original format
    }
    return(list(m = m, mi = mi))
}

htmMatrixToXYV <- function(xx, yy, m, mi) {
    val = vector(length=length(xx))
    for(i in seq(1:length(xx))) {
        val[mi[yy[i],xx[i]]] = m[yy[i],xx[i]]
    }
    return(val)
}


#
# Treatment Summary
#

htmTreatmentSummary <- function(data, measurements, col_Experiment, col_Treatment, col_ObjectCount, col_QC, negative_ctrl, positive_ctrl, excluded_Experiments) {

    echo("")
    echo("Treatment Summary:")
    echo("******************")
    echo("")
    
    # get all necessary information
    experiments <- sort(unique(data[[col_Experiment]]))
    experiments <- experiments[!experiments %in% excluded_Experiments]
    treatments  <- sort(unique(data[[col_Treatment]]))
    
    
    # output
    echo(""); echo("Experiments:")
    for(experiment in experiments)
    {
        echo(""); echo(experiment)
    }
    echo(experiments)
    echo(""); echo("Number of treatments: ", length(treatments))
    echo(""); echo("Negative control: ", negative_ctrl)
    echo(""); echo("Positive control: ", positive_ctrl)
    echo(""); echo("Measurements: ", measurements)
    echo(""); echo("")

    if(!all(sapply(measurements, function(x) x %in% names(data)))) {
        echo("ERROR: measurement ", measurement, " does not exist in data")
        return(0)
    }
    if(!(col_ObjectCount %in% names(data))) {
        echo("ERROR: object count ", col_ObjectCount, " does not exist in data")
        return(0)
    }
    
    
    numTreatments = length(treatments)

    results <- data.frame(measurement      = rep(NA, numTreatments),
                          controls         = rep(negative_ctrl, numTreatments),
                          treatment        = rep(NA, numTreatments),
                          batches          = rep(NA, numTreatments),
                          means            = rep(NA, numTreatments),
                          median__means    = rep(NA, numTreatments),

                          t_test__estimate = rep(NA,numTreatments),
                          t_test__p_value  = rep(NA,numTreatments),
                          t_test__p_value_adjusted  = rep(NA,numTreatments),
                          t_test__signCode = rep(NA,numTreatments),

                          mean_number_of_objects_per_image=rep(NA,numTreatments),
                         
                          numObjectsOK     = rep(NA,numTreatments),
                          numImagesOK      = rep(NA,numTreatments), 
                          numReplicatesOK  = rep(NA,numTreatments),
                          #numPositionsOK=rep(NA,numTreatments),
                          #numPositions=rep(NA,numTreatments),
                          stringsAsFactors = FALSE
    )
    results <- lapply(measurements, function(x){
        results$measurement <- x
        results
    })
    names(results) <- measurements
    
    
    ###################################
    # Compute stats
    ###################################
    
    echo("Computing statistics...")

    for(measurement in measurements){

        echo("***********************************************************************")
        echo("Measurement: ", measurement)

        # Select negative controls
        ids_negctrl <- if(negative_ctrl == "All treatments"){
            which(data[[col_QC]]==1 & !(data[[col_Experiment]] %in% excluded_Experiments) & !is.na(data[[measurement]]))
        } else{
            which(data[[col_QC]]==1 & !(data[[col_Experiment]] %in% excluded_Experiments) & !is.na(data[[measurement]]) & data[[col_Treatment]] %in% negative_ctrl)
        }
        
        i <- 0
         
        for(treatment in treatments) {
            
            # ********************************
            # T-test  
            # ********************************
            
            ids_treatment = (1:nrow(data))[data[[col_Treatment]] == treatment]
            
            # init
            t_test__p_value  = NA
            t_test__signCode = NA
            t_test__estimate = NA
            z_scores         = NA
            median__z_scores = NA
            median__means    = NA
            means            = NA
            batches          = NA
            d = data.frame(value=NA, treatment=NA, experiment=NA)
            
            # compute
            # only keep valid treatment values to find the corresponding experiments
            ids    <- ids_treatment[which(data[ids_treatment,col_QC]==1 & !(data[ids_treatment, col_Experiment] %in% excluded_Experiments) & !is.na(data[ids_treatment,measurement]))]
            ids_ok <- c(ids, ids_negctrl)
            exps   <- unique(data[ids,col_Experiment])
                
                # extract treatment and control values of the respective experiments
                d <- subset(data[ids_ok,], 
                            (data[ids_ok, col_Experiment] %in% exps), 
                            select = c(col_Treatment,measurement,col_Experiment,col_ObjectCount))
                
                names(d)[names(d)==measurement]     <- "value"
                names(d)[names(d)==col_Treatment]   <- "treatment"
                names(d)[names(d)==col_Experiment]  <- "experiment"
                names(d)[names(d)==col_ObjectCount] <- "count"
                
                d[1:length(ids), "treatment"] <- treatment
                d[(length(ids)+1):(length(ids)+length(ids_negctrl)), "treatment"] <- "control"
                
                
                if ( (sum(d$treatment=="control")>1) & (sum(d$treatment==treatment)>1) ) {
                    
                    d$treatment <- as.factor(d$treatment)
                    d$treatment <- relevel( d$treatment, "control" ) # control must be the 1st level for the linear model
                    t <- t.test(d$value ~ d$treatment)  # as there typically is enough data no equal variance is assumed
                    
                    nBlocks = length(unique(d$experiment)) 
                    n = nrow(d)
                    
                    t_test__p_value  <- 2 - 2 * pt( abs(t$statistic), df = n - (nBlocks-1) - 2 )
                    t_test__estimate <- t$estimate[2]
    
                }
                
                if ( (sum(d$treatment=="control")>=1) & (sum(d$treatment==treatment)>=1) ) {
                    
                    d_ctrl = d[d$treatment=="control",]
                    means_ctrl <- tapply(d_ctrl$value, d_ctrl$experiment, mean)
                    sds_ctrl <- tapply(d_ctrl$value, d_ctrl$experiment, sd)
                    
                    d_treat = d[d$treatment==treatment,]
                    means_treat <- tapply(d_treat$value, d_treat$experiment, mean)
                    
                    tryCatch(z_scores <- (means_treat - means_ctrl) / sds_ctrl
                             , error = function(e) {
                                 echo(d)
                                 echo(treatment)
                                 echo(means_treat)
                                 echo(negative_ctrl)
                                 echo(means_ctrl)
                                 #print(sds_ctrl)
                                 echo(z_scores)
                                 echo(ids)
                                 echo(idsOld)
                                 echo(data[ids,])
                                 echo(data[idsOld,])
                                 echo(e)
                                 
                                 
                                 ddd
                             })
                    
                    median__z_scores = median(z_scores)
                    
                    z_scores = paste(round(z_scores,2),collapse=";")
                    
                }
                
                #print(d)
                #print(treat)
                #print(means_treat)
                #print(negative_ctrl)
                #print(means_ctrl)
                #print(sds_ctrl)
                #print(z_scores)
                #ddd        
                
                
            # select treatment for debugging
            if(!(treatment %in% negative_ctrl)) {
                d_treated = d[d$treatment==treatment,]
            } else {
                d_treated = d[d$treatment=="control",]
            }
            
            
            # these  values need no negative control, that's why they are outside of above if-statement
            means_treated <- tapply(d_treated$value, d_treated$experiment, mean)
            batches       <- paste(names(means_treated),collapse=";")
            means         <- paste(round(means_treated,3),collapse=";")
            median__means <- median(means_treated)
            
            
            i = i + 1
            results[[measurement]]$treatment[i] <- treatment
            results[[measurement]]$batches[i] = batches
            results[[measurement]]$means[i] = means
            results[[measurement]]$median__means[i] = median__means
            results[[measurement]]$t_test__p_value[i] = t_test__p_value
            results[[measurement]]$t_test__p_value_adjusted[i] = NA # this will be computed below after the treatment loop
            results[[measurement]]$t_test__signCode[i] = NA # this will be computed below after the treatment loop
            results[[measurement]]$t_test__estimate[i] = t_test__estimate
            #results[[measurement]]$z_scores[i] = z_scores
            #results[[measurement]]$median__z_scores[i] = median__z_scores
            results[[measurement]]$numObjectsOK[i] = sum(d_treated$count)
            results[[measurement]]$numImagesOK[i] = nrow(d_treated)
            results[[measurement]]$numReplicatesOK[i]= length(unique(d_treated$experiment))
            results[[measurement]]$mean_number_of_objects_per_image[i] = results[[measurement]]$numObjectsOK[i]/results[[measurement]]$numImagesOK[i]
            
            
        }  # treatment loop   
    
    
        #
        # Adjust p-values
        #
        # FDR = False discovery rate = FP / (FP + TP)
        #   TP + FP = total number of "hits"
        # FP = False positive
        # TP = True positive
        #
        # BH adjustment method:
        # - say we have M measurements
        # - sort all the p-values
        # - multiply the p-values with M/K, where the K is the rank in the ordering
        #       - that means that the lowest p-value will be multiplied with M/1, the 2nd lowest with M/2, a.s.o.
        #
        # - after this adjustment a p-value threshold of 0.05 means that the FDR is 0.05
        # - in other words: the probability that a hit is a false positive is 0.05
        #
        # Literature:
        # - http://varianceexplained.org/statistics/interpreting-pvalue-histogram/
        #
        #
    

        results[[measurement]]$t_test__p_value_adjusted = p.adjust(results[[measurement]]$t_test__p_value, method = "BH")
        
        results[[measurement]]$t_test__signCode <- ifelse(results[[measurement]]$t_test__p_value_adjusted<0.001,"***",
                                                   ifelse(results[[measurement]]$t_test__p_value_adjusted<0.01,"**",
                                                   ifelse(results[[measurement]]$t_test__p_value_adjusted<0.05,"*",
                                                   ifelse(results[[measurement]]$t_test__p_value_adjusted<0.1,".",
                                                   " "
                                                         ))))

        echo("")
        echo("Done for measurement '", measurement, "'. Created Treatment Summary Table.")
        
        
        # Diagnostics 
        
        #hist(res)
        #dev.new()
        #qqnorm(res)
        #qqline(res)
        #print(wellScoreForANOVA)
        
        # display controls plot: raw well scores
        #print("Plot control scores...")
        #htmJitterplot(htm, cx="experiment", cy=well_raw_score, .ylab=well_raw_score, datatype="wells", 
        #              treatmentSubset = htmGetListSetting(htm,"statistics","negativeControl"),
        #              showMedian = F, showMean = T)
        
        # display controls plot: batch corrected well scores
        #print("Plot batch corrected control scores...")
        #htmJitterplot(htm, cx="experiment", cy=wellMinusMeanCtrlScores, .ylab=wellMinusMeanCtrlScores, datatype="wells", 
        #              treatmentSubset = htmGetListSetting(htm,"statistics","negativeControl"),
        #              showMedian = F, showMean = T)
        
        
        # save controls plot
        #  htmJitterplot(htm, cx="experiment", cy=wellScoreForANOVA, .ylab=wellScoreForANOVA, datatype="wells", 
        #                treatmentSubset = htmGetListSetting(htm,"statistics","negativeControl"),
        #                showMedian = F, showMean = T, save2file = T, newdev = F)
        
        # save histogram as plot
        #  print(paste("histo:",wellMinusMeanCtrlScores))
        #  htmHisto(wellMinusMeanCtrlScores, datatype="wells", treatmentSubset = htmGetListSetting(htm,"statistics","negativeControl"), save2file=T)
        
        #htm@wellSummary$exp_treat = paste(htm@wellSummary$experiment,htm@wellSummary$treatment,sep="_")
        #edit(htm@wellSummary$exp_treat)
        #print(wellMinusMeanCtrlScores)
        # todo: plot only if makes sense
        #htmJitterplot(htm, cx="exp_treat", cy=wellMinusMeanCtrlScores, .ylab=wellMinusMeanCtrlScores, datatype="wells", 
        #                treatmentSubset = c(htmGetListSetting(htm,"statistics","negativeControl"),htmGetListSetting(htm,"statistics","positiveControl")),
        #                showMedian = F, showMean = T, save2file = F, newdev = F)
        
        
        #####
    
        if(positive_ctrl != "None selected") {
            
            echo("")
            echo("")
            echo("Checking positive and negative control separation in each batch:")
            echo("")
            echo("Measurement: ", measurement)
            echo("Positive control: ", positive_ctrl)
            echo("Negative control: ", negative_ctrl)
            echo("")
            
            z_scores = c()
            
            for(exp in experiments) {
                
                d <- subset(data, (data[[col_Experiment]]==exp) & (data[[col_QC]]==1) & !(is.na(data[[measurement]])), select = c(col_Treatment, measurement))
                names(d)[names(d) == measurement] <- "value"
                names(d)[names(d) == col_Treatment] <- "treatment"
                
                d_neg    <- subset(d,d$treatment == negative_ctrl)
                mean_neg <- mean(d_neg$value)
                sd_neg   <- sd(d_neg$value)
                n_neg    <- length(d_neg$value)
                
                d_pos    <- subset(d,d$treatment == positive_ctrl)
                mean_pos <- mean(d_pos$value)
                sd_pos   <- sd(d_pos$value)
                n_pos    <- length(d_pos$value)
                
                #print(paste(min_neg,max_neg,mean_pos,sd_pos))
                #probability_of_pos_outside_neg = 1 - integrate( function(x) {dnorm(x,mean=mean_pos,sd=sd_pos)}, min_neg, max_neg)$value
                z_score = (mean_pos-mean_neg) / sd_neg
                z_scores = c(z_scores, z_score)
                #t_value = (mean_pos-mean_neg) / sqrt(sd_pos^2+sd_neg^2)
                
                
                #print(paste0(exp,"  N_neg: ",n_neg,"  N_pos: ",n_pos,"  Probability: ",round(probability_of_pos_outside_neg,3))) #,"  t-value: ",t_value))
                #quality = ifelse(abs(z_score)<1,"XX",
                #                 ifelse(abs(z_score)<2,"X",""
                #                               ))
                quality = ""
                
                #if ( exp %in% excluded_Experiments ) {
                #    comment = "(Excluded)  " 
                #} else {
                comment = ""
                #}
                
                echo(comment, exp, "; N_neg: ", n_neg, "; N_pos: ", n_pos, "; mean z-score of positive controls: ", round(z_score,3), " ", quality) #,"  t-value: ",t_value))
                
            }
            
            echo("")
            echo("z-scores (N, mean, sd): ", length(z_scores), " ", mean(z_scores, na.rm=T), " ", sd(z_scores, na.rm=T))
            
        }
        
    }
    

    # sorted hit-list with significance level * ** ***
    # plot colored according to significance level
    # with hits marked as sign
    results_ordered <- lapply(results, function(df){
        df[order(df$t_test__p_value),]
    })
    results_ordered <- do.call(rbind, results_ordered)
    row.names(results_ordered) <- NULL
    
    results_ordered
}

getObjectPositionColumn <- function( names, axis )
{
    
    name = paste0( axis, "Centroid" )
    if ( name %in% names )   return ( name );
    
    return ( "NA" );
    
}