/src/R/nucleominer.R - NucleoMiner - Forge du Centre Blaise Pascal

root / src / R / nucleominer.R @ ec2936ea

Historique | Voir | Annoter | Télécharger (86,57 ko)

       # get_content = function(# Get content from cached
       # ### Access to the cached content of a file via the global variable NM_CACHE. Load content in NM_CACHE if needed.
       # obj, ##<< The object whose content is requested.
       # ... ##<< Parameters that will be passed to my_read
       # ) {
       #   UseMethod("get_content", obj)
       #   ### Returns the cached content of the current object.
       # }
+      #
       # get_content.default = structure( function(# Get content from cached
       # ### Access to the cached content of a file via the global variable NM_CACHE. Load content in NM_CACHE if needed.
       # obj, ##<< The object whose content is requested.
       # ... ##<< Parameters that will be passed to my_read
       # ) {
       #   if (inherits(try(NM_CACHE,TRUE), "try-error") || is.null(NM_CACHE)) {
       #     NM_CACHE <<- list()
       #   }
       #   if (is.null(NM_CACHE[[obj$filename]])) {
       #     print(paste("Loading file ",obj$filename, sep=""))
       #     tmp_content = my_read(obj, ...)
       #     print("affect it...")
       #     NM_CACHE[[obj$filename]] <<- tmp_content
       #     print("done.")
       #   }
       #   return(NM_CACHE[[obj$filename]])
       # ### Returns the cached content of the current object.
       # }, ex=function(){
       #   # Create a dataframe
       #   df = NULL
       #   df = dfadd(df, list(key1 = "value1", key2 = "value2"))
       #   df = dfadd(df, list(key1 = "value1'", key2 = "value3'"))
       #   # Dump it into tmp file
       #   write.table(df, file="/tmp/tmp.dump.table.tmp")
       #   # Load it into cache using feature.
       #   cached_content_object  = list(filename="/tmp/tmp.dump.table.tmp")
       #   class(cached_content_object) = "table"
       #   # The first time, it will be loaded into the cache
       #   print(get_content(cached_content_object))
       #   # The second time, it will not
       #   print(get_content(cached_content_object))
+      #
       # })
+      #
       # my_read = function(
       # ### Abstract my_read function.
       #   obj, ...) {
       #   UseMethod("my_read", obj)
       # }
+      #
       # my_read.default = function(
       # ### Default my_read function.
       #   obj, ...){
       #   stop(paste("ERROR, my_read is not defined for any Objects (file ", obj$filename," )", sep=""))
       # }
+      #
       # my_read.fasta = function(
       # ### my_read function for fasta files.
       #   obj, ...){
       #   # require(seqinr)
       #   return(read.fasta(obj$filename, ...))
       # }
+      #
       # my_read.table = function(
       # ### my_read function for table files.
       #   obj, ...){
       #   if (rev(unlist(strsplit(obj$filename, ".", fixed=TRUE)))[1] == "gz") {
       #     return(read.table(file=gzfile(obj$filename), ...))
       #   } else {
       #     return(read.table(file=obj$filename, ...))
       #   }
       # }
+      #
       # my_read.cvs = function(
       # ### my_read function for cvs files.
       #   obj, ...){
       #   return(read.csv(file=obj$filename, ...))
       # }
       FDR = structure(function# False Discovery Rate
       ### From a vector x of independent p-values, extract the cutoff corresponding to the specified FDR, using the step-up procedure of Benjamini & Hochberg (1995): the cutoff is the largest sorted p-value whose estimated FDR is below the requested level.
       ##author<< Gael Yvert,
       (
       x, ##<< A vector x of independent p-values. NA values are ignored.
       FDR ##<< The specified FDR.
       ) {
         x <- sort(na.omit(x))
         N = length(x)
         # For the i-th smallest p-value, N * x[i] is the number of positives expected
         # by chance and i the number observed; their ratio estimates the FDR at rank i.
         passing = which(N * x / seq_len(N) < FDR)
         if (length(passing) == 0) {
           # No rank satisfies the requested FDR (this also covers an empty input).
           return(NA)
         }
         # Step-up rule: keep the HIGHEST passing rank, even if a lower rank failed.
         return(x[max(passing)])
       ### Return the corresponding cutoff, or NA when no p-value satisfies the specified FDR.
       }, ex=function(){
         print("example")
       })
       llr_score_nvecs = structure(function # Likelihood ratio
       ### Compute the log likelihood ratio between modelling each set of values with its own Gaussian and modelling all sets pooled together with a single Gaussian.
       (
         xs ##<< list of vectors.
       ) {
         nb_sets = length(xs)
         if (nb_sets < 1) {
           return(NA)
         }
         if (nb_sets == 1) {
           return(1)
         }
         # Log likelihood of a sample under the Gaussian fitted on that same sample.
         gauss_loglik = function(values) {
           sum(log(dnorm(values, mean=mean(values), sd=sd(values))))
         }
         separate_ll = 0
         for (values in xs) {
           # A set with 0 or 1 value has no standard deviation: give up.
           if (length(values) <= 1) {
             return(NA)
           }
           separate_ll = separate_ll + gauss_loglik(values)
         }
         pooled_ll = gauss_loglik(unlist(xs))
         return(separate_ll - pooled_ll)
       ### Returns the log likelihood ratio (NA for an empty list or a set with fewer than 2 values, 1 for a single set).
       }, ex=function(){
         # LOD score for 2 set of values
         mean1=5; sd1=2; card2 = 250
         mean2=6; sd2=3; card1 = 200
         x1 = rnorm(card1, mean1, sd1)
         x2 = rnorm(card2, mean2, sd2)
         x_lo = floor(min(c(x1,x2)))
         x_hi = ceiling(max(c(x1,x2)))
         hist(c(x1,x2), xlim=c(x_lo, x_hi), breaks=x_lo:x_hi)
         lines(x_lo:x_hi,dnorm(x_lo:x_hi,mean1,sd1)*card1,col=2)
         lines(x_lo:x_hi,dnorm(x_lo:x_hi,mean2,sd2)*card2,col=3)
         lines(x_lo:x_hi,dnorm(x_lo:x_hi,mean(c(x1,x2)),sd(c(x1,x2)))*card2,col=4)
         llr_score_nvecs(list(x1,x2))
       })
       dfadd = structure(function# Adding list to a dataframe.
       ### Add a list \emph{l} to a dataframe \emph{df}. Create it if \emph{df} is \emph{NULL}. Return the dataframe \emph{df}.
       (df, ##<< A dataframe, or NULL to create a new one.
        l ##<< A list; it is converted to a dataframe (strings are kept as strings) and appended as new row(s).
       ) {
         new_rows = data.frame(l,stringsAsFactors=FALSE)
         if (is.null(df)) {
           df = new_rows
         } else {
           df = rbind(df, new_rows)
         }
         return(df)
       ### Return the dataframe \emph{df}.
       }, ex=function(){
         ## Here dataframe is NULL
         # (df must be assigned before printing, otherwise print(df) shows the stats::df function)
         df = NULL
         print(df)
         # Initialize df
         df = dfadd(df, list(key1 = "value1", key2 = "value2"))
         print(df)
         # Adding elements to df
         df = dfadd(df, list(key1 = "value1'", key2 = "value2'"))
         print(df)
       })
       sign_from_strand = function(
       ### Get the sign of each strand: +1 for a forward ("F") strand, -1 for anything else.
       strands) {
         signs = numeric(length(strands))
         for (k in seq_along(strands)) {
           if (strands[k] == "F") {
             signs[k] = 1
           } else {
             signs[k] = -1
           }
         }
         # Carry over names, if any, so the result lines up with the input.
         names(signs) = names(strands)
         signs
       ### If strand in forward then returns 1 else returns -1
       }
       flat_reads = function(
       ### Extract reads coordinates from TemplateFilter input reads. Each input row is expanded into as many copies of its coordinate (column 2, truncated to integer) as its count (column 4). A strand with no read yields an empty vector.
       reads, ##<< TemplateFilter input reads: a dataframe whose column 2 holds the coordinate, column V3 the strand ("F" or "R") and column 4 the number of reads at that coordinate.
       nuc_width ##<< Width used to shift F and R reads.
       ) {
         # Repeat each coordinate of the given strand according to its read count.
         # Working on the columns directly (instead of apply() over the transposed
         # dataframe) keeps the result a plain vector and supports empty strands.
         expand_strand = function(strand) {
           on_strand = which(reads$V3 == strand)
           rep(as.integer(reads[[2]][on_strand]), as.integer(reads[[4]][on_strand]))
         }
         F_flatted_reads = expand_strand("F")
         R_flatted_reads = expand_strand("R")
         # F reads are shifted downstream and R reads upstream by half a nucleosome,
         # so that both point at the same position.
         flatted_reads = c(F_flatted_reads + nuc_width/2, R_flatted_reads - nuc_width/2)
         return(list(F_flatted_reads, R_flatted_reads, flatted_reads))
       ### Returns a list of F reads, R reads and joint/shifted F and R reads.
       }
       filter_tf_outputs = function(# Filter TemplateFilter outputs
       ### Keep the TemplateFilter nucleosomes that lie on the requested chromosome and entirely inside the observed window, whose correlation score reaches the threshold, and that do not overlap too much a better-scored nucleosome.
       tf_outputs, ##<< TemplateFilter outputs.
       chr, ##<< Chromosome observed, here chr is an integer.
       x_min, ##<< Coordinate of the first bp observed.
       x_max, ##<< Coordinate of the last bp observed.
       nuc_width = 160, ##<< Nucleosome width.
       ol_bp = 59, ##<< Overlap Threshold.
       corr_thres = 0.5 ##<< Correlation threshold.
       ) {
         # A negative x_min means the window is given with negated coordinates:
         # mirror it back before comparing with nucleosome bounds.
         if (x_min < 0) {
           win_lo = -x_max
           win_hi = -x_min
         } else {
           win_lo = x_min
           win_hi = x_max
         }
         chr_label = paste("chr", chr, sep="")
         half_width = tf_outputs$width/2
         in_window = tf_outputs$chr == chr_label & tf_outputs$center - half_width >= win_lo & tf_outputs$center + half_width <= win_hi
         tf_outputs = tf_outputs[in_window,]
         tf_outputs$lower_bound = tf_outputs$center - tf_outputs$width/2
         tf_outputs$upper_bound = tf_outputs$center + tf_outputs$width/2
         tf_outputs = tf_outputs[tf_outputs$correlation.score >= corr_thres,]
         # Best scores first: each nucleosome evicts the lower-ranked ones it overlaps.
         tf_outputs = tf_outputs[order(tf_outputs$correlation.score, decreasing=TRUE),]
         rank = 1
         while (rank <= nrow(tf_outputs)) {
           ref_lb = tf_outputs$lower_bound[rank]
           ref_ub = tf_outputs$upper_bound[rank]
           overlaps_right = tf_outputs$lower_bound <= (ref_ub-ol_bp) & tf_outputs$upper_bound > ref_ub
           overlaps_left = tf_outputs$upper_bound >= (ref_lb+ol_bp) & tf_outputs$lower_bound < ref_lb
           tf_outputs = tf_outputs[!(overlaps_right | overlaps_left),]
           rank = rank + 1
         }
         return(tf_outputs)
       ### Returns filtered TemplateFilter Outputs
       }
       filter_tf_inputs = function(# Filter TemplateFilter inputs
       ### Keep the TemplateFilter input reads that belong to the observed genome area. Reads are first selected on the area widened by nuc_width on both sides; unless filter_for_coverage is set, they are then selected on their strand-corrected coordinate (shifted by half a nucleosome using sign_from_strand).
       inputs, ##<< TF inputs to be filtered.
       chr, ##<< Chromosome observed, here chr is an integer.
       x_min, ##<< Coordinate of the first bp observed.
       x_max, ##<< Coordinate of the last bp observed.
       nuc_width = 160, ##<< Nucleosome width.
       only_f = FALSE, ##<< Filter only F reads.
       only_r = FALSE, ##<< Filter only R reads.
       filter_for_coverage = FALSE ##<< Does it filter for plot coverage?
       ) {
         # Coarse selection: right chromosome, inside the window widened by nuc_width.
         keep = inputs[,1]==chr & inputs[,2] >= x_min - nuc_width & inputs[,2] <= x_max + nuc_width
         # only_f takes precedence over only_r when both are set.
         if (only_f) {
           keep = keep & inputs[,3] == "F"
         } else if (only_r) {
           keep = keep & inputs[,3] == "R"
         }
         inputs = inputs[keep,]
         if (filter_for_coverage) {
           return(inputs)
         }
         # Fine selection on the strand-corrected coordinate of each read.
         shifted_coords = inputs[,2] + nuc_width/2 * sign_from_strand(inputs[,3])
         in_area = inputs[,1]==chr & shifted_coords >= x_min & shifted_coords <= x_max
         return(inputs[in_area,])
       ### Returns filtred inputs.
       }
       get_comp_strand = function(
       ### Compute the complementary strand: each nucleotide is replaced by its complement (a<->t, c<->g, lower or upper case). Any other symbol (e.g. "n") is left unchanged, so the result always has the same length as the input. The order of the nucleotides is not reversed.
       strand ##<< The original strand, as a vector of single-character nucleotides.
       ) {
         # chartr() substitutes character by character; as.vector() drops attributes
         # so that only the names of the input are carried over to the result.
         comp = chartr("atcgATCG", "tagcTAGC", as.vector(strand))
         names(comp) = names(strand)
         comp
       ### Returns the complementary strand.
       }
       aggregate_intra_strain_nucs = structure(function(# Aggregate replicated sample's nucleosomes.
       ### This function aggregates nucleosomes for replicated samples. It uses the TemplateFilter output of each sample as a replicate. Each sample owns a set of nucleosomes computed using TemplateFilter and ordered by the position of their center. Adjacent nucleosomes are compared two by two. The comparison is based on a log likelihood ratio score. The outcome of the comparison is either the merge or the separation of the adjacent nucleosomes. Finally the function returns a list of clusters and all computed \emph{llr_scores}. Each cluster owns an attribute \emph{wp} for "well positioned". This attribute is set to \emph{TRUE} if the cluster is composed of exactly one nucleosome of each sample.
       samples, ##<< A list of samples. Each sample is a list like \emph{sample = list(id=..., marker=..., strain=..., roi=..., inputs=..., outputs=...)} with \emph{roi = list(name=..., begin=...,  end=..., chr=..., genome=...)}.
       llr_thres=20, ##<< Log likelihood ratio threshold.
       coord_max=20000000 ##<< A too big value to be a coord for a nucleosome lower bound.
       ){
         # TRUE once every track reader is exhausted, i.e. no reader holds a
         # (non NA) coordinate below coord_max.
         end_of_tracks = function(tracks) {
           !any(tracks < coord_max, na.rm=TRUE)
         }
         # Flag the cluster as well positioned (exactly one nucleosome from each
         # track) and append it to clusters if its center lies in
         # [min_nuc_center, max_nuc_center).
         store_cluster = function(clusters, new_cluster, nb_nucs_in_cluster,nuc_from_track,nb_tracks, min_nuc_center, max_nuc_center) {
           new_cluster$wp = (nb_nucs_in_cluster==nb_tracks) && (sum(nuc_from_track)==nb_tracks)
           center = (new_cluster$lower_bound + new_cluster$upper_bound) / 2
           if (is.null(min_nuc_center) || ((min_nuc_center <= center) && (center < max_nuc_center))) {
             clusters[[length(clusters) + 1]] = new_cluster
           }
           return(clusters)
         }
         strain = samples[[1]]$strain
         llr_scores = c()
         min_nuc_center = min(samples[[1]]$roi$begin, samples[[1]]$roi$end)
         max_nuc_center = max(samples[[1]]$roi$begin, samples[[1]]$roi$end)
         # compute clusters
         clusters = list()
         current_nuc = NULL
         # Above the threshold, so that the very first nucleosome opens a cluster.
         llr_score = llr_thres + 1
         # Read nucs from TF outputs: one track per sample, sorted by center, with
         # a reader holding the center of the next nucleosome to consume.
         tf_outs = list()
         indexes = c()
         track_readers = c()
         for (i in seq_along(samples)) {
           sorted_outputs = samples[[i]]$outputs
           sorted_outputs = sorted_outputs[order(sorted_outputs$center),]
           tf_outs[[i]] = sorted_outputs
           indexes[i] = 1
           first_center = sorted_outputs[1,]$center
           if (is.na(first_center)) {
             # Empty track: mark it as exhausted right away.
             track_readers[i] = coord_max
           } else {
             track_readers[i] = first_center
           }
         }
         nb_tracks = length(tf_outs)
         new_cluster = NULL
         nb_nucs_in_cluster = 0
         nuc_from_track = rep(FALSE, nb_tracks)
         # Start clustering: always consume the nucleosome with the smallest center.
         while (!end_of_tracks(track_readers)) {
           new_center = min(track_readers)
           current_track = which(track_readers == new_center)[1]
           new_nuc = as.list(tf_outs[[current_track]][indexes[current_track],])
           new_nuc$chr = samples[[current_track]]$roi$chr
           new_nuc$inputs = filter_tf_inputs(samples[[current_track]]$inputs, new_nuc$chr, new_nuc$lower_bound, new_nuc$upper_bound, new_nuc$width)
           new_nuc$track = current_track
           flatted_reads = flat_reads(new_nuc$inputs, new_nuc$width)
           new_nuc$original_reads = flatted_reads[[3]]
           if (!is.null(current_nuc)) {
             llr_score = llr_score_nvecs(list(current_nuc$original_reads,new_nuc$original_reads))
             llr_scores = c(llr_scores,llr_score)
           }
           # An undefined score (too few reads) is treated as "do not merge".
           if (is.na(llr_score)) {
             llr_score = llr_thres + 1
           }
           # Store llr_score
           new_nuc$llr_score = llr_score
           if (llr_score < llr_thres) {
             # aggregate to current cluster
             #   update bound
             if (new_nuc$upper_bound > new_cluster$upper_bound) {
               new_cluster$upper_bound = new_nuc$upper_bound
             }
             if (new_nuc$lower_bound < new_cluster$lower_bound) {
               new_cluster$lower_bound = new_nuc$lower_bound
             }
             #   add nucleosome to current cluster
             nuc_from_track[current_track] = TRUE
             nb_nucs_in_cluster = nb_nucs_in_cluster + 1
             new_cluster$nucs[[length(new_cluster$nucs)+1]] = new_nuc
           } else {
             if (!is.null(new_cluster)) {
               # store old cluster
               clusters = store_cluster(clusters, new_cluster, nb_nucs_in_cluster,nuc_from_track,nb_tracks,min_nuc_center, max_nuc_center)
             }
             # Reinit current cluster composition stuff
             nuc_from_track = rep(FALSE, nb_tracks)
             # create new cluster (full element names: no reliance on partial matching of `$`)
             new_cluster = list(lower_bound=new_nuc$lower_bound, upper_bound=new_nuc$upper_bound, chr=new_nuc$chr, strain_ref=strain , nucs=list())
             # add nucleosome to current cluster
             nb_nucs_in_cluster = 1
             nuc_from_track[current_track] = TRUE
             new_cluster$nucs[[length(new_cluster$nucs)+1]] = new_nuc
           }
           current_nuc = new_nuc
           # update indexes
           if (indexes[current_track] < length(tf_outs[[current_track]]$center)) {
             indexes[current_track] = indexes[current_track] + 1
             # update track
             track_readers[current_track] = tf_outs[[current_track]][indexes[current_track],]$center
           } else {
             # update track: nothing left to read on this track
             track_readers[current_track] = coord_max
           }
         }
         # store last cluster
         if (!is.null(new_cluster)) {
           clusters = store_cluster(clusters, new_cluster, nb_nucs_in_cluster,nuc_from_track,nb_tracks,min_nuc_center, max_nuc_center)
         }
         return(list(clusters, llr_scores))
       ### Returns a list of clusterized nucleosomes, and all computed llr scores.
       }, ex=function(){
         # Dealing with a region of interest
         roi =list(name="example", begin=1000,  end=1300, chr="1", genome=rep("A",301))
         samples = list()
         for (i in 1:3) {
           # Create TF output
           tf_nuc = list("chr"=paste("chr", roi$chr, sep=""), "center"=(roi$end + roi$begin)/2, "width"= 150, "correlation.score"= 0.9)
           outputs = dfadd(NULL,tf_nuc)
           outputs = filter_tf_outputs(outputs, roi$chr, roi$begin, roi$end)
           # Generate corresponding reads
           nb_reads = round(runif(1,170,230))
           reads = round(rnorm(nb_reads, tf_nuc$center,20))
           u_reads = sort(unique(reads))
           strands = sample(c(rep("R",ceiling(length(u_reads)/2)),rep("F",floor(length(u_reads)/2))))
           counts = apply(t(u_reads), 2, function(r) { sum(reads == r)})
           shifts = apply(t(strands), 2, function(s) { if (s == "F") return(-tf_nuc$width/2) else return(tf_nuc$width/2)})
           u_reads = u_reads + shifts
           inputs = data.frame(list("V1" = rep(roi$chr, length(u_reads)),
                                    "V2" = u_reads,
                                    "V3" = strands,
                                    "V4" = counts), stringsAsFactors=FALSE)
           samples[[length(samples) + 1]] = list(id=1, marker="Mnase_Seq", strain="strain_ex", total_reads = 10000000, roi=roi, inputs=inputs, outputs=outputs)
         }
         print(aggregate_intra_strain_nucs(samples))
       })
       flat_aggregated_intra_strain_nucs = function(# to flat aggregate_intra_strain_nucs function output
       ### This function builds a dataframe with one row per cluster obtained from aggregate_intra_strain_nucs function. Columns are chr, lower_bound, upper_bound, cur_index, index_nuc, wp, nb_reads, nb_nucs, llr_1 and llr_2. For a well positioned cluster, llr_1 and llr_2 are the llr scores of its 2nd and 3rd nucleosomes (NA when the cluster holds fewer nucleosomes); they are NA for other clusters.
       partial_strain_maps, ##<< the list of clusters, as built by aggregate_intra_strain_nucs function
       cur_index ##<< the index of the roi involved
       ) {
         # llr score (5 significant digits) of the k-th nucleosome of a cluster,
         # or NA when the cluster has fewer than k nucleosomes (e.g. 2 replicates).
         nth_llr = function(nucs, k) {
           if (length(nucs) >= k) {
             signif(nucs[[k]]$llr_score,5)
           } else {
             NA
           }
         }
         if  (length(partial_strain_maps) == 0 ){
           print(paste("Empty partial_strain_maps for roi", cur_index, "ands current strain." ))
           tmp_strain_maps = list()
         } else {
           tmp_strain_map = lapply(seq_along(partial_strain_maps), function(i){
             tmp_nuc = partial_strain_maps[[i]]
             tmp_nuc_as_list = list()
             tmp_nuc_as_list[["chr"]] = tmp_nuc[["chr"]]
             # Bounds are rounded inwards to integer coordinates.
             tmp_nuc_as_list[["lower_bound"]] = ceiling(tmp_nuc[["lower_bound"]])
             tmp_nuc_as_list[["upper_bound"]] = floor(tmp_nuc[["upper_bound"]])
             tmp_nuc_as_list[["cur_index"]] = cur_index
             tmp_nuc_as_list[["index_nuc"]] = i
             tmp_nuc_as_list[["wp"]] = as.integer(tmp_nuc$wp)
             all_original_reads = unlist(lapply(tmp_nuc$nucs, function(nuc) nuc$original_reads))
             tmp_nuc_as_list[["nb_reads"]] = length(all_original_reads)
             tmp_nuc_as_list[["nb_nucs"]] = length(tmp_nuc$nucs)
             if (tmp_nuc$wp) {
               tmp_nuc_as_list[["llr_1"]] = nth_llr(tmp_nuc$nucs, 2)
               tmp_nuc_as_list[["llr_2"]] = nth_llr(tmp_nuc$nucs, 3)
             } else {
               tmp_nuc_as_list[["llr_1"]] = NA
               tmp_nuc_as_list[["llr_2"]] = NA
             }
             return(tmp_nuc_as_list)
           })
           tmp_strain_maps = do.call("rbind", tmp_strain_map)
         }
         # rbind() of lists gives a matrix of list cells: unlist every column to
         # get a regular dataframe.
         return(data.frame(lapply(data.frame(tmp_strain_maps, stringsAsFactors=FALSE), unlist), stringsAsFactors=FALSE))
       ### Returns a dataframe of all clusters obtain from aggregate_intra_strain_nucs function.
       }
       align_inter_strain_nucs = structure(function(# Aligns nucleosomes between 2 strains.
       ### This function aligns nucs between two strains for a given genome region. Each well positioned cluster of strain 1 is translated into strain 2 coordinates (via translate_cur) and paired with the well positioned clusters of strain 2 that it overlaps; a log likelihood ratio score is computed for every pair whose nucleosomes all reach the correlation threshold. Redundant rows are then removed.
       replicates, ##<< Set of replicates, ideally 3 per strain.
       wp_nucs_strain_ref1=NULL, ##<< List of aggregates nucleosome for strain 1. If it's null this list will be computed.
       wp_nucs_strain_ref2=NULL, ##<< List of aggregates nucleosome for strain 2. If it's null this list will be computed.
       corr_thres=0.5, ##<< Correlation threshold.
       llr_thres=100, ##<< LOD cut off. NOTE: currently not applied; every retained pair is reported together with its llr_score.
       config=NULL, ##<< GLOBAL config variable
       ... ##<< A list of parameters that will be passed to \emph{aggregate_intra_strain_nucs} if needed.
       ) {
         # Remove redundant rows: when two consecutive rows are equal on all
         # key_cols, drop the one of the two with the lower value in score_col
         # (the second one on ties). Does nothing when there is no duplicated key
         # or when the duplicated keys are not on consecutive rows.
         drop_redundant_rows = function(nucs_df, key_cols, score_col) {
           if (is.null(nucs_df) || nrow(nucs_df) < 2) {
             return(nucs_df)
           }
           keys = nucs_df[,key_cols]
           if (nrow(unique(keys)) == nrow(keys)) {
             return(nucs_df)
           }
           index_redundant = which(apply(keys[-nrow(keys),] == keys[-1,] ,1,sum) == length(key_cols))
           to_remove_list = c()
           for (idx in index_redundant) {
             if (nucs_df[idx,score_col] < nucs_df[idx+1,score_col]) {
               to_remove = idx
             } else {
               to_remove = idx + 1
             }
             to_remove_list = c(to_remove_list, to_remove)
           }
           # Guard: negative indexing with an empty vector would drop every row.
           if (length(to_remove_list) > 0) {
             nucs_df = nucs_df[-to_remove_list,]
           }
           return(nucs_df)
         }
         if (length(replicates) < 2) {
           stop("ERROR, align_inter_strain_nucs needs 2 replicate sets.")
         } else if (length(replicates) > 2) {
           print("WARNING, align_inter_strain_nucs will use 2 first sets of replicates as inputs.")
         }
         common_nuc = NULL
         llr_scores = c()
         chr = replicates[[1]][[1]]$roi$chr
         min_nuc_center = min(replicates[[1]][[1]]$roi$begin, replicates[[1]][[1]]$roi$end)
         max_nuc_center = max(replicates[[1]][[1]]$roi$begin, replicates[[1]][[1]]$roi$end)
         strain_ref1 = replicates[[1]][[1]]$strain
         strain_ref2 = replicates[[2]][[1]]$strain
         orig_big_cur = replicates[[1]][[1]]$orig_roi
         # GO!
         if (is.null(wp_nucs_strain_ref1)) {
           wp_nucs_strain_ref1 = aggregate_intra_strain_nucs(replicates[[1]], ...)[[1]]
         }
         if (is.null(wp_nucs_strain_ref2)) {
           wp_nucs_strain_ref2 = aggregate_intra_strain_nucs(replicates[[2]], ...)[[1]]
         }
         # Bounds of every strain 2 cluster, used to look for overlaps.
         lws = c()
         ups = c()
         for (na in wp_nucs_strain_ref2) {
           lws = c(lws, na$lower_bound)
           ups = c(ups, na$upper_bound)
         }
         print(paste("Exploring chr" , chr , ", " , length(wp_nucs_strain_ref1) , ", [" , min_nuc_center , ", " , max_nuc_center , "] nucs...", sep=""))
         if (length(wp_nucs_strain_ref1) == 0) {
           print("WARNING, no nucs for strain_ref1.")
           return(NULL)
         }
         for(index_nuc_strain_ref1 in seq_along(wp_nucs_strain_ref1)){
           nuc_strain_ref1 = wp_nucs_strain_ref1[[index_nuc_strain_ref1]]
           # Filtering on Well Positionned
           if (nuc_strain_ref1$wp) {
             roi_strain_ref1 = list(name=paste("strain_chr_id_" , strain_ref1 , "_" , chr , "_" , "i" , "_", sep=""), begin=nuc_strain_ref1$lower_bound, end=nuc_strain_ref1$upper_bound, chr=chr, strain_ref = strain_ref1)
             roi_strain_ref2 = translate_cur(roi_strain_ref1, strain_ref2, big_cur=orig_big_cur, config=config)
             if (!is.null(roi_strain_ref2)){
               # Strain 2 clusters overlapping the translated strain 1 cluster
               lower_bound_roi_strain_ref2 = min(roi_strain_ref2$end,roi_strain_ref2$begin)
               upper_bound_roi_strain_ref2 = max(roi_strain_ref2$end,roi_strain_ref2$begin)
               matching_nas = which( lower_bound_roi_strain_ref2 <= ups & lws <= upper_bound_roi_strain_ref2)
               for (index_nuc_strain_ref2 in matching_nas) {
                 nuc_strain_ref2 = wp_nucs_strain_ref2[[index_nuc_strain_ref2]]
                 # Filtering on Well Positionned, and on the strain 2 cluster
                 # being translatable back into strain 1
                 nuc_strain_ref2_to_roi = list(begin=nuc_strain_ref2$lower_bound, end=nuc_strain_ref2$upper_bound, chr=nuc_strain_ref2$chr, strain_ref = strain_ref2)
                 if (!is.null(translate_cur(nuc_strain_ref2_to_roi, strain_ref1, big_cur=orig_big_cur, config=config)) &
                     nuc_strain_ref2$wp) {
                   # Filtering on correlation Score and collecting reads
                   # NOTE(review): nuc$corr relies on partial matching of `$`,
                   # presumably towards correlation.score - confirm.
                   SKIP = FALSE
                   # TODO: This for loop could be done before working on strain_ref2. Isn't it?
                   reads_strain_ref1 = c()
                   for (nuc in nuc_strain_ref1$nucs){
                     reads_strain_ref1 = c(reads_strain_ref1, nuc$original_reads)
                     if (nuc$corr < corr_thres) {
                       SKIP = TRUE
                     }
                   }
                   reads_strain_ref2 = c()
                   for (nuc in nuc_strain_ref2$nucs){
                     reads_strain_ref2 = c(reads_strain_ref2, nuc$original_reads)
                     if (nuc$corr < corr_thres) {
                       SKIP = TRUE
                     }
                   }
                   # Filtering on correlation Score
                   if (!SKIP) {
                     # translation of reads into strain 2 coords
                     diff = ((roi_strain_ref1$begin + roi_strain_ref1$end) - (roi_strain_ref2$begin + roi_strain_ref2$end)) / 2
                     reads_strain_ref1 = reads_strain_ref1 - rep(diff, length(reads_strain_ref1))
                     llr_score = llr_score_nvecs(list(reads_strain_ref1, reads_strain_ref2))
                     llr_scores = c(llr_scores, llr_score)
                     # No filtering on LOD Score here (llr_thres is not applied):
                     # the pair is always reported, with its score.
                     tmp_nuc = list()
                     # strain_ref1
                     tmp_nuc[[paste("chr_", strain_ref1, sep="")]] = chr
                     tmp_nuc[[paste("lower_bound_", strain_ref1, sep="")]] = nuc_strain_ref1$lower_bound
                     tmp_nuc[[paste("upper_bound_", strain_ref1, sep="")]] = nuc_strain_ref1$upper_bound
                     tmp_nuc[[paste("mean_", strain_ref1, sep="")]] = signif(mean(reads_strain_ref1),5)
                     tmp_nuc[[paste("sd_", strain_ref1, sep="")]] = signif(sd(reads_strain_ref1),5)
                     tmp_nuc[[paste("nb_reads_", strain_ref1, sep="")]] = length(reads_strain_ref1)
                     tmp_nuc[[paste("index_nuc_", strain_ref1, sep="")]] = index_nuc_strain_ref1
                     # strain_ref2 (the "means_" prefix differs from strain 1's
                     # "mean_"; kept as is since it names an output column)
                     tmp_nuc[[paste("chr_", strain_ref2, sep="")]] = roi_strain_ref2$chr
                     tmp_nuc[[paste("lower_bound_", strain_ref2, sep="")]] = nuc_strain_ref2$lower_bound
                     tmp_nuc[[paste("upper_bound_", strain_ref2, sep="")]] = nuc_strain_ref2$upper_bound
                     tmp_nuc[[paste("means_", strain_ref2, sep="")]] = signif(mean(reads_strain_ref2),5)
                     tmp_nuc[[paste("sd_", strain_ref2, sep="")]] = signif(sd(reads_strain_ref2),5)
                     tmp_nuc[[paste("nb_reads_", strain_ref2, sep="")]] = length(reads_strain_ref2)
                     tmp_nuc[[paste("index_nuc_", strain_ref2, sep="")]] = index_nuc_strain_ref2
                     # common
                     tmp_nuc[["llr_score"]] = signif(llr_score,5)
                     common_nuc = dfadd(common_nuc, tmp_nuc)
                   }
                 }
               }
             } else {
               print("WARNING! No roi for strain ref 2.")
             }
           }
         }
         # Columns 1:3 are chr/lower_bound/upper_bound of strain 1, columns 8:10
         # the same for strain 2, and column 15 is llr_score.
         common_nuc = drop_redundant_rows(common_nuc, 1:3, 15)
         common_nuc = drop_redundant_rows(common_nuc, 8:10, 15)
         return(list(common_nuc, llr_scores))
       ### Returns a list of clusterized nucleosomes, and all computed llr scores. Returns NULL if there is no nucleosome for strain 1.
       }, ex=function(){
         # Define new translate_cur function...
         translate_cur = function(roi, strain2, big_cur=NULL, config=NULL) {
           return(roi)
         }
         # Binding it by uncomment follwing lines.
         unlockBinding("translate_cur", as.environment("package:nucleominer"))
         unlockBinding("translate_cur", getNamespace("nucleominer"))
         assign("translate_cur", translate_cur, "package:nucleominer")
         assign("translate_cur", translate_cur, getNamespace("nucleominer"))
         lockBinding("translate_cur", getNamespace("nucleominer"))
         lockBinding("translate_cur", as.environment("package:nucleominer"))
         # Dealing with a region of interest
         roi =list(name="example", begin=1000,  end=1300, chr="1", genome=rep("A",301), strain_ref1 = "STRAINREF1")
         roi2 = translate_cur(roi, roi$strain_ref1)
         replicates = list()
         for (j in 1:2) {
           samples = list()
           for (i in 1:3) {
             # Create TF output
             tf_nuc = list("chr"=paste("chr", roi$chr, sep=""), "center"=(roi$end + roi$begin)/2, "width"= 150, "correlation.score"= 0.9)
             outputs = dfadd(NULL,tf_nuc)
             outputs = filter_tf_outputs(outputs, roi$chr, roi$begin, roi$end)
             # Generate corresponding reads
             nb_reads = round(runif(1,170,230))
             reads = round(rnorm(nb_reads, tf_nuc$center,20))
             u_reads = sort(unique(reads))
             strands = sample(c(rep("R",ceiling(length(u_reads)/2)),rep("F",floor(length(u_reads)/2))))
             counts = apply(t(u_reads), 2, function(r) { sum(reads == r)})
             shifts = apply(t(strands), 2, function(s) { if (s == "F") return(-tf_nuc$width/2) else return(tf_nuc$width/2)})
             u_reads = u_reads + shifts
             inputs = data.frame(list("V1" = rep(roi$chr, length(u_reads)),
                                      "V2" = u_reads,
                                      "V3" = strands,
                                      "V4" = counts), stringsAsFactors=FALSE)
             samples[[length(samples) + 1]] = list(id=1, marker="Mnase_Seq", strain=paste("strain_ex",j,sep=""), total_reads = 10000000, roi=roi, inputs=inputs, outputs=outputs)
           }
           replicates[[length(replicates) + 1]] = samples
         }
         print(align_inter_strain_nucs(replicates))
       })
       fetch_mnase_replicates = function(# Prefetch data
       ### Fetch and filter inputs and outputs per region of interest, for every Mnase_Seq sample of the given strain. Returns a list with one entry per sample.
       strain, ##<< The strain for which we want the Mnase_Seq samples.
       roi, ##<< Region of interest.
       all_samples, ##<< Global list of samples.
       config=NULL, ##<< GLOBAL config variable
       only_fetch=FALSE, ##<< If TRUE, only fetch and do not filter. It is used to load sample files into memory before forking.
       get_genome=FALSE, ##<< If TRUE, load corresponding genome sequence.
       get_ouputs=TRUE##<< If TRUE, also get the corresponding TF output files.
       ) {
         is_mnase_of_strain <- all_samples$marker == "Mnase_Seq" & all_samples$strain == strain
         fetched <- list()
         for (sample_id in unique(all_samples[is_mnase_of_strain, ]$id)) {
           cur <- as.list(all_samples[all_samples$id == sample_id, ])
           cur$orig_roi <- roi
           # The roi is translated towards the sample's own strain.
           cur$roi <- translate_cur(roi, cur$strain, config = config)
           if (get_genome) {
             # Get genome: slice of the cached fasta content covering the translated roi.
             fasta <- get_content(config$FASTA_REFERENCE_GENOME_FILES[[cur$strain]], "fasta")
             chr_keys <- switch_pairlist(config$FASTA_INDEXES[[cur$strain]])
             cur$roi$genome <- fasta[[chr_keys[[cur$roi$chr]]]][cur$roi$begin:cur$roi$end]
           }
           # Both TF files of a sample share the same path prefix.
           tf_prefix <- paste(config$ALIGN_DIR, "/TF/sample_", sample_id, sep = "")
           # Get inputs
           cur$inputs <- get_content(paste(tf_prefix, "_TF.txt", sep = ""), "table", stringsAsFactors = FALSE)
           # The total is computed on the unfiltered inputs.
           cur$total_reads <- sum(cur$inputs[, 4])
           if (!only_fetch) {
             cur$inputs <- filter_tf_inputs(cur$inputs, cur$roi$chr, min(cur$roi$begin, cur$roi$end), max(cur$roi$begin, cur$roi$end), 300)
           }
           # Get TF outputs for Mnase_Seq samples
           if (cur$marker == "Mnase_Seq" & get_ouputs) {
             cur$outputs <- get_content(paste(tf_prefix, "_all_nucs.tab", sep = ""), "table", header = TRUE, sep = "\t")
             if (!only_fetch) {
               cur$outputs <- filter_tf_outputs(cur$outputs, cur$roi$chr, min(cur$roi$begin, cur$roi$end), max(cur$roi$begin, cur$roi$end), 300)
             }
           }
           fetched[[length(fetched) + 1]] <- cur
         }
         return(fetched)
       }
       substract_region = function(# Subtract from a list of regions another list of regions that intersect it.
       ### This function embeds a recursive part, used when a subtracted region splits an original region in two. Only the first four columns of region1 and region2 are used. The result is a data.frame of the remaining (cropped or split) regions sorted by lower_bound; the NULL value is passed through when the recursive step yields NULL.
       region1, ##<< Original regions.
       region2 ##<< Regions to subtract.
       ) {
         # Worker: for each row of region1, remove the parts covered by rows of region2.
         # Its value is the value of the apply() assignment below.
         # NOTE(review): 1:length(...) evaluates to c(1, 0) when region1 has no rows - confirm callers never pass an empty table.
         rec_substract_region = function(region1, region2) {
         non_inter_fuzzy = apply(t(1:length(region1[,1])), 2, function(i) {
           cur_fuzzy = region1[i,]
           # Rows of region2 that overlap the current region (bounds are inclusive).
           inter_wp = region2[region2$lower_bound <= cur_fuzzy$upper_bound & region2$upper_bound >= cur_fuzzy$lower_bound,]
           if (length(inter_wp[,1]) > 0) {
             ret = c()
             # The overlapping rows are applied one after the other; crops accumulate in cur_fuzzy.
             for (j in 1:length(inter_wp[,1])) {
               cur_wp = inter_wp[j,]
               if (cur_wp$lower_bound <= cur_fuzzy$lower_bound & cur_fuzzy$upper_bound <= cur_wp$upper_bound) {
                 # cur_wp covers the whole region: remove cur_fuzzy and stop looking further.
                 ret = c()
                 break
               } else if (cur_wp$lower_bound <= cur_fuzzy$lower_bound & cur_wp$upper_bound < cur_fuzzy$upper_bound) {
                 # cur_wp overlaps the lower side: crop the region so that it starts right after cur_wp.
                 cur_fuzzy$lower_bound = cur_wp$upper_bound + 1
                 ret = cur_fuzzy
               } else if (cur_fuzzy$lower_bound < cur_wp$lower_bound & cur_fuzzy$upper_bound <= cur_wp$upper_bound) {
                 # cur_wp overlaps the upper side: crop the region so that it ends right before cur_wp.
                 cur_fuzzy$upper_bound = cur_wp$lower_bound - 1
                 ret = cur_fuzzy
               } else if (cur_wp$lower_bound > cur_fuzzy$lower_bound & cur_wp$upper_bound < cur_fuzzy$upper_bound) {
                 # cur_wp lies strictly inside the region: split it in two pieces and
                 # subtract the overlapping rows from both pieces recursively.
                 tmp_ret_fuzzy_1 = cur_fuzzy
                 tmp_ret_fuzzy_1$upper_bound = cur_wp$lower_bound - 1
                 tmp_ret_fuzzy_2 = cur_fuzzy
                 tmp_ret_fuzzy_2$lower_bound = cur_wp$upper_bound + 1
                 ret = rec_substract_region(rbind(tmp_ret_fuzzy_1, tmp_ret_fuzzy_2), inter_wp)
                 # print(ret)
                 # ret = cur_fuzzy
                 break
               } else {
                 stop("WARNING NO ADAPTED CASE!")
+              }
+            }
             return(ret)
           } else {
             # No overlap at all: the region is kept unchanged.
             return(cur_fuzzy)
+          }
         })
+        }
         non_inter_fuzzy = rec_substract_region(region1[,1:4], region2[,1:4])
         if (is.null(non_inter_fuzzy)) {return(non_inter_fuzzy)}
         # Flatten the (possibly nested) apply result and rebuild a 4-column table, one region per row.
         tmp_ulist = unlist(non_inter_fuzzy)
         # The first four names of the flattened vector are reused as column names.
         # NOTE(review): the code below expects them to include chr, lower_bound and upper_bound - confirm against callers.
         tmp_names = names(tmp_ulist)[1:4]
         non_inter_fuzzy = data.frame(matrix(tmp_ulist, ncol=4, byrow=TRUE), stringsAsFactors=FALSE)
         names(non_inter_fuzzy) = tmp_names
         # chr and both bounds are converted to numeric before sorting on lower_bound.
         non_inter_fuzzy$chr = as.character(non_inter_fuzzy$chr)
         non_inter_fuzzy$chr = as.numeric(non_inter_fuzzy$chr)
         non_inter_fuzzy$lower_bound = as.numeric(non_inter_fuzzy$lower_bound)
         non_inter_fuzzy$upper_bound = as.numeric(non_inter_fuzzy$upper_bound)
         non_inter_fuzzy = non_inter_fuzzy[order(non_inter_fuzzy$lower_bound),]
         return(non_inter_fuzzy)
+      }
       union_regions = function(# Aggregate regions that intersect themselves.
       ### Regions are sorted by lower bound and each lower bound is compared with the upper bound of the previous region; consecutive regions that overlap or are adjacent are merged into one. The pass is repeated until the number of regions becomes stable.
       regions ##<< The regions to be aggregated.
       ) {
         if (is.null(regions)) {
           return(regions)
         }
         if (nrow(regions) == 0) {
           return(regions)
         }
         repeat {
           regions <- regions[order(regions$lower_bound), ]
           nb_regions <- nrow(regions)
           # A run of merged regions ends where the gap to the next region is larger than 1.
           # The last region is never flagged here; it is appended as the final run end below.
           gaps <- regions$lower_bound[-1] - regions$upper_bound[-nb_regions]
           run_ends <- which(!c(gaps <= 1, TRUE))
           if (length(run_ends) == 0 || run_ends[length(run_ends)] != nb_regions) {
             run_ends <- c(run_ends, nb_regions)
           }
           run_begs <- c(1, run_ends[-length(run_ends)] + 1)
           # One merged region per run; chr and cur_index are taken from the first member of the run.
           merged <- lapply(seq_along(run_begs), function(k) {
             members <- run_begs[k]:run_ends[k]
             data.frame(list(
               chr = regions$chr[run_begs[k]],
               lower_bound = min(regions$lower_bound[members]),
               upper_bound = max(regions$upper_bound[members]),
               cur_index = regions$cur_index[run_begs[k]]
             ))
           })
           merged <- collapse_regions(merged)
           # Stable when a full pass did not merge anything.
           is_stable <- nrow(merged) == nb_regions
           regions <- merged
           if (is_stable) {
             break
           }
         }
         return(regions)
       }
       # remove_aligned_wp = function(# Remove wp nucs from common nucs list.
       # ### It is based on common wp nucs index on nucs and region.
       # strain_maps, ##<< Nuc maps.
       # cur_index, ##<< The region of interest index.
       # tmp_common_nucs, ##<< the list of wp nucs.
       # strain##<< The strain to consider.
       # ){
       #   fuzzy_nucs = strain_maps[[strain]]
       #   fuzzy_nucs = fuzzy_nucs[fuzzy_nucs$cur_index == cur_index,]
       #   fuzzy_nucs = fuzzy_nucs[order(fuzzy_nucs$index_nuc),]
       #   if (length(fuzzy_nucs[,1]) == 0) {return(fuzzy_nucs)}
       #   if (sum(fuzzy_nucs$index_nuc == min(fuzzy_nucs$index_nuc):max(fuzzy_nucs$index_nuc)) != max(fuzzy_nucs$index_nuc)) {"Warning in index!"}
       #   anti_index_1 = tmp_common_nucs[[paste("index_nuc", strain, sep="_")]]
       #   fuzzy_nucs = fuzzy_nucs[-anti_index_1,]
       #   return(fuzzy_nucs)
       # }
       translate_regions = function(# Translate a list of regions from a strain ref to another.
       ### This function is an elaborated call to translate_cur: each region is wrapped as a roi whose strain_ref is combi[2], translated towards combi[1] with roi passed as big_cur, and the translated regions are collapsed into a single table.
       regions, ##<< Regions to be translated.
       combi, ##<< Combination of strains.
       cur_index, ##<< The region of interest index.
       config=NULL, ##<< GLOBAL config variable
       roi ##<< The region of interest.
       ) {
         translate_one <- function(i) {
           region <- regions[i, ]
           region_as_roi <- list(name = "foo", begin = region$lower_bound, end = region$upper_bound, chr = as.character(region$chr), strain_ref = combi[2])
           translated <- translate_cur(region_as_roi, combi[1], config = config, big_cur = roi)
           if (is.null(translated)) {
             return(NULL)
           }
           # Bounds are reordered so that lower_bound <= upper_bound whatever the orientation.
           data.frame(list(
             chr = translated$chr,
             lower_bound = min(translated$begin, translated$end),
             upper_bound = max(translated$begin, translated$end),
             cur_index = cur_index
           ))
         }
         # apply() is kept on purpose: when every region translates to NULL it yields NULL,
         # which collapse_regions passes through.
         row_ids <- t(1:length(regions[, 1]))
         collapse_regions(apply(row_ids, 2, translate_one))
       }
       collapse_regions = function(# Reformat an "apply manipulated" list of regions
       ### Utils to reformat an "apply manipulated" list of regions: the list is row-bound into one table, chr and both bounds are converted to numeric, and rows are sorted by lower_bound. NULL is passed through.
       regions ##<< A list of regions.
       ) {
         if (is.null(regions)) {
           return(NULL)
         }
         stacked <- do.call(rbind, regions)
         # chr goes through character first, then numeric.
         stacked$chr <- as.numeric(as.character(stacked$chr))
         for (bound in c("lower_bound", "upper_bound")) {
           stacked[[bound]] <- as.numeric(stacked[[bound]])
         }
         stacked[order(stacked$lower_bound), ]
       }
       crop_fuzzy = function(# Crop bound of regions according to region of interest bound
       ### The function is no longer necessary since the "big_cur" bug was removed from the translate_cur function. Bounds lying outside the translated roi are moved onto its nearest limit, then regions whose two bounds are equal are dropped.
       tmp_fuzzy_nucs, ##<< The regions to be cropped.
       roi, ##<< The region of interest.
       strain, ##<< The strain to consider.
       config=NULL ##<< GLOBAL config variable
       ) {
         tr_roi <- translate_cur(roi, strain, config = config)
         roi_lo <- min(tr_roi$begin, tr_roi$end)
         roi_hi <- max(tr_roi$begin, tr_roi$end)
         # Replace, in the given column, every value flagged as outside by the roi limit.
         move_to_limit <- function(nucs, column, is_outside, limit) {
           if (any(is_outside)) {
             nucs[is_outside, column] <- limit
           }
           nucs
         }
         # Same order as always: values below the roi first, then values above it.
         tmp_fuzzy_nucs <- move_to_limit(tmp_fuzzy_nucs, "lower_bound", tmp_fuzzy_nucs$lower_bound < roi_lo, roi_lo)
         tmp_fuzzy_nucs <- move_to_limit(tmp_fuzzy_nucs, "upper_bound", tmp_fuzzy_nucs$upper_bound < roi_lo, roi_lo)
         tmp_fuzzy_nucs <- move_to_limit(tmp_fuzzy_nucs, "lower_bound", tmp_fuzzy_nucs$lower_bound > roi_hi, roi_hi)
         tmp_fuzzy_nucs <- move_to_limit(tmp_fuzzy_nucs, "upper_bound", tmp_fuzzy_nucs$upper_bound > roi_hi, roi_hi)
         # Regions collapsed onto a single position are discarded.
         tmp_fuzzy_nucs[tmp_fuzzy_nucs$upper_bound != tmp_fuzzy_nucs$lower_bound, ]
       }
       get_all_reads = function(# Retrieve Reads
       ### Retrieve reads for a given marker, combi, form. For "Mnase_Seq" and then for the marker, the "<combi[1]>_<combi[2]>_<manip>_<form>_and_nbreads.tab" table(s) are read from config$RESULTS_DIR. Columns 1 to 9 plus the added "form" column are taken once from the first table; the remaining columns of every table are bound next to them. An unsupported form raises an explicit error.
       marker, ##<< The marker to consider.
       combi, ##<< The strain combination to consider.
       form="wp", ##<< The nuc form to consider: "wp", "unr" or "wpunr" (both, wp rows first).
       config=NULL ##<< GLOBAL config variable
       ) {
         # Fail early with a readable message instead of an "object not found" error further down.
         if (length(form) != 1 || !(form %in% c("wp", "unr", "wpunr"))) {
           stop(paste("Unsupported form '", paste(form, collapse=","), "': expected \"wp\", \"unr\" or \"wpunr\".", sep=""))
         }
         # Load the table of one manip for one elementary form ("wp" or "unr") and tag its rows with that form.
         read_form = function(manip, nuc_form) {
           out_filename = paste(config$RESULTS_DIR, "/", combi[1], "_", combi[2], "_", manip, "_", nuc_form, "_and_nbreads.tab", sep="")
           tab = read.table(file=out_filename, header=TRUE)
           if (nuc_form == "unr") {
             # Only rows where column 3 minus column 2 exceeds 75 are kept for the unr form.
             tab = tab[tab[,3] - tab[,2] > 75,]
           }
           tab$form = nuc_form
           tab
         }
         all_reads = NULL
         for (manip in c("Mnase_Seq", marker)) {
           if (form == "wpunr") {
             tmp_res = rbind(read_form(manip, "wp"), read_form(manip, "unr"))
           } else {
             tmp_res = read_form(manip, form)
           }
           # Shared columns: the first nine and the last one (the form tag).
           shared_cols = c(1:9, length(tmp_res))
           if (is.null(all_reads)) {
             all_reads = tmp_res[, shared_cols]
           }
           tmp_res = tmp_res[, -shared_cols]
           all_reads = cbind(all_reads, tmp_res)
         }
         return(all_reads)
       ### A data.frame made of the shared columns followed by the remaining columns of each manip.
       }
       get_design = function(# Build the design for deseq
       ### This function builds the design according to sample properties: one row per sample of the two strains, first for "Mnase_Seq" then for the marker, named "<strain>_<manip>_<id>" and described by its manip and its strain.
       marker, ##<< The marker to consider.
       combi, ##<< The strain combination to consider.
       all_samples ##<< Global list of samples.
       ) {
         # Manual switches, both disabled (0). A value of 1, 2 or 3 masks that row out of a
         # group of three: off1 applies to the first three rows of the strain-ordered sample
         # table, off2 to the following ones.
         off1 <- 0
         off2 <- 0
         keep_mask <- function(off) {
           key <- toString(off)
           if (key == "1") {
             return(c(0, 1, 1))
           }
           if (key == "2") {
             return(c(1, 0, 1))
           }
           if (key == "3") {
             return(c(1, 1, 0))
           }
           c(1, 1, 1)
         }
         row_labels <- c()
         manip_col <- c()
         strain_col <- c()
         for (manip in c("Mnase_Seq", marker)) {
           in_combi <- all_samples$strain == combi[1] | all_samples$strain == combi[2]
           picked <- all_samples[in_combi & all_samples$marker == manip, ]
           picked <- picked[order(picked$strain), ]
           if (manip == "H3K4me1" & (off1 != 0 & off2 == 0)) {
             picked <- picked[c(keep_mask(off1), c(1, 1)) == 1, ]
           } else if (manip != "Mnase_Seq" & (off1 != 0 | off2 != 0)) {
             picked <- picked[c(keep_mask(off1), keep_mask(off2)) == 1, ]
           }
           manip_col <- c(manip_col, rep(manip, length(picked$id)))
           for (strain in combi) {
             ids <- picked[picked$strain == strain & picked$marker == manip, ]$id
             # One label per sample id; yields character(0) when the strain has no sample.
             labels <- vapply(ids, function(id) paste(strain, manip, id, sep = "_"), character(1), USE.NAMES = FALSE)
             strain_col <- c(strain_col, rep(strain, length(labels)))
             row_labels <- c(row_labels, labels)
           }
         }
         data.frame(row.names = row_labels, manip = manip_col, strain = strain_col)
       }
       plot_dist_samples = function(# Plot the distribution of reads.
       ### This function uses the deseq normalization feature to compare qualitatively the distributions: one density curve per sample of the given strain and marker, each count column being divided by its size factor.
       strain, ##<< The strain to consider.
       marker, ##<< The marker to consider.
       res, ##<< Data
       all_samples, ##<< Global list of samples.
       NEWPLOT = TRUE ##<< If FALSE the curves will be added to the current plot.
       ) {
         sample_ids <- all_samples[all_samples$strain == strain & all_samples$marker == marker, ]$id
         # Count columns are named "<strain>_<marker>_<id>".
         cols <- vapply(sample_ids, function(id) paste(strain, marker, id, sep = "_"), character(1), USE.NAMES = FALSE)
         design <- data.frame(
           row.names = cols,
           manip = rep(marker, length(cols)),
           strain = rep(strain, length(cols))
         )
         cds <- newCountDataSet(res[, cols], design)
         size_factors <- estimateSizeFactors(cds)[[1]]
         if (NEWPLOT) {
           # Invisible curve (col=0): it only sets up the axes and the title.
           plot(density(res[, paste(strain, marker, sample_ids[1], sep = "_")] / size_factors[1]), col = 0, main = paste(strain, marker))
         }
         for (it in 1:length(sample_ids)) {
           column <- paste(strain, marker, sample_ids[it], sep = "_")
           lines(density(res[, column] / size_factors[it]), col = it + 1, lty = it)
         }
         legend("topright", col = (1:length(sample_ids)) + 1, lty = 1:length(sample_ids), legend = cols)
       }
       analyse_design = function(# Launch deseq methods.
       ### This function is based on the deseq example. It normalizes the data, fits them to a GLM model with and without interaction term and compares the two models.
       snep_design, ##<< The design to consider.
       reads ##<< The data to consider.
       ) {
         # Count columns are selected through the row names of the design.
         counts <- reads[, rownames(snep_design)]
         cds <- newCountDataSet(counts, snep_design)
         # Size factors and dispersions are estimated afresh for each of the two fits.
         prepare <- function() {
           estimateDispersions(estimateSizeFactors(cds), fitType = "local", method = "pooled", sharingMode = "maximum")
         }
         # Model with the manip:strain interaction term ...
         fit1 <- fitNbinomGLMs(prepare(), count ~ manip * strain)
         # ... and model without it.
         fit0 <- fitNbinomGLMs(prepare(), count ~ manip + strain)
         pvals <- nbinomGLMTest(fit1, fit0)
         list(fit1, fit0, snep_design, pvals)
       }
       get_sneps = structure(function(# Compute the list of SNEPs for a given set of marker, strain combination and nuc form.
       ### This function builds the design (get_design), loads the reads (get_all_reads) and runs analyse_design on them. The 2nd to 4th columns of the interaction fit and the GLM p-values are stored, rounded to 5 significant digits, in the reads table; a row is flagged as SNEP when its p-value is below the threshold returned by FDR.
       marker, ##<< The marker involved.
       combi, ##<< The strain combination involved.
       form, ##<< the nuc form involved.
       all_samples, ##<< Global list of samples.
       config=NULL ##<< GLOBAL config variable
       ) {
         # PRETREAT
         design <- get_design(marker, combi, all_samples)
         reads <- get_all_reads(marker, combi, form, config = config)
         # RUN ANALYSE
         analysis <- analyse_design(design, reads)
         # RESULTS
         full_fit <- analysis[[1]]
         fit_cols <- names(full_fit)
         for (pos in 2:4) {
           reads[[fit_cols[pos]]] <- signif(full_fit[[fit_cols[pos]]], 5)
         }
         reads$pvalsGLM <- signif(analysis[[4]], 5)
         fdr <- 0.0001
         reads$snep_index <- reads$pvalsGLM < FDR(reads$pvalsGLM, fdr)
         print(paste(sum(reads$snep_index), " SNEPs found for ", length(reads[,1])," nucs and ", fdr*100,"% of FDR.", sep = ""))
         return(reads)
         },  ex=function(){
           marker = "H3K4me1"
           combi = c("BY", "YJM")
           form = "wpunr" # "wp" | "unr" | "wpunr"
           # foo = get_sneps(marker, combi, form)
           # foo = get_sneps("H4K12ac", c("BY", "RM"), "wp")
       })
       ROM2ARAB = function(# Roman to Arabic pair list.
       ### Util to convert Roman to Arabic: a list named by the Roman numerals I to XX whose values are the numbers 1 to 20.
       ){
         numerals <- c(
           "I", "II", "III", "IV", "V",
           "VI", "VII", "VIII", "IX", "X",
           "XI", "XII", "XIII", "XIV", "XV",
           "XVI", "XVII", "XVIII", "XIX", "XX"
         )
         # The position of a numeral in the vector is its value.
         structure(as.list(as.numeric(seq_along(numerals))), names = numerals)
       }
       switch_pairlist = structure(function(# Switch a pairlist
       ### Take a pairlist key:value and return the switched pairlist value:key. Values are converted to character to be used as names.
       l ##<< The pairlist to switch.
       ) {
         # Fold over the keys, in order, registering each key under its value.
         Reduce(function(switched, key) {
           switched[[as.character(l[[key]])]] <- key
           switched
         }, names(l), list())
       ### The switched pairlist.
       }, ex=function(){
       	l = list(key1 = "value1", key2 = "value2")
       	print(switch_pairlist(l))
       })
       ARAB2ROM = function(# Arabic to Roman pair list.
       ### Util to convert Arabic to Roman: the ROM2ARAB pair list with keys and values switched.
       ){
         roman_to_arabic <- ROM2ARAB()
         switch_pairlist(roman_to_arabic)
       }
       c2c_extraction = function(# Extract a sub part of the corresponding c2c file
       ### This function gives access to a specific part of the c2c file. The table is loaded through get_content and restricted to rows whose V6 column is "-". When the file is stored in the opposite strain order, columns V1/V2/V3 are swapped with V7/V9/V10. If chr is given, only rows of that chromosome (column V1) are kept and, if bounds are given, rows lying entirely below lower_bound or entirely above upper_bound are dropped, together with zero-width rows.
       strain1, ##<< the key strain
       strain2, ##<< the target strain
       chr=NULL, ##<< if defined, the c2c will be filtered according to the chromosome value
       lower_bound=NULL, ##<< if defined (and chr is defined), the c2c will be filtered for the part of the genome above lower_bound
       upper_bound=NULL, ##<< if defined (and chr is defined), the c2c will be filtered for the part of the genome below upper_bound
       config=NULL##<<  GLOBAL config variable
       ) {
         reverse = (strain1=="RM" & strain2=="BY") | strain1=="YJM"
         # Launch c2c file
         if (reverse) {
           c2c_key = paste(strain2, "-", strain1, sep="")
         } else {
           c2c_key = paste(strain1, "-", strain2, sep="")
         }
         c2c = get_content(config$C2C_FILES[[c2c_key]], "table", stringsAsFactors=FALSE)
         # Filtering ungapped
         c2c = c2c[c2c$V6=="-",]
         # Reverse: swap the two sides of the table.
         if (reverse) {
           for (pair in list(c("V1", "V7"), c("V2", "V9"), c("V3", "V10"))) {
             tmp_col = c2c[[pair[1]]]
             c2c[[pair[1]]] = c2c[[pair[2]]]
             c2c[[pair[2]]] = tmp_col
           }
         }
         if (!is.null(chr)) {
           # Chromosome name as spelled in column V1 for strain1.
           if (strain1 == "BY") {
             chro_1 = paste("chr", ARAB2ROM()[[chr]], sep="")
           } else if (strain1 == "RM") {
             chro_1 = paste("supercontig_1.",chr,sep="")
           } else if (strain1 == "YJM") {
             chro_1 = switch_pairlist(config$FASTA_INDEXES$YJM)[[chr]]
           } else {
             # Without this branch chro_1 stays undefined and the filter below fails obscurely.
             stop(paste("c2c_extraction: unsupported strain1 '", strain1, "' for chromosome filtering.", sep=""))
           }
           c2c = c2c[c2c$V1 == chro_1,]
           if (!is.null(lower_bound)) {
             # Rows entirely below lower_bound are collapsed to zero width (both orientations), then dropped.
             below_fwd = c2c$V3 < lower_bound & c2c$V2 < c2c$V3
             if (any(below_fwd)) {c2c[below_fwd, c("V2", "V3")] = lower_bound}
             below_rev = c2c$V2 < lower_bound & c2c$V3 < c2c$V2
             if (any(below_rev)) {c2c[below_rev, c("V2", "V3")] = lower_bound}
             c2c = c2c[c2c$V2 - c2c$V3 != 0,]
           }
           if (!is.null(upper_bound)) {
             # Same treatment for rows entirely above upper_bound.
             above_fwd = c2c$V2 > upper_bound & c2c$V2 < c2c$V3
             if (any(above_fwd)) {c2c[above_fwd, c("V2", "V3")] = upper_bound}
             above_rev = c2c$V3 > upper_bound & c2c$V3 < c2c$V2
             if (any(above_rev)) {c2c[above_rev, c("V2", "V3")] = upper_bound}
             c2c = c2c[c2c$V2 - c2c$V3 != 0,]
           }
         }
         return(c2c)
       ### It returns the appropriate c2c file part.
       }
       translate_cur = structure(function(# Translate coords of a genome region.
       ### This function is used in the examples, usually you have to define your own translation function and overwrite this one using \emph{unlockBinding} features. Please, refer to the example. The roi is located in the c2c table of the (strain1, strain2) pair: the rows covering its begin and its end give the offsets used to compute the coordinates in strain2.
       roi, ##<< Original genome region of interest.
       strain2, ##<< The strain in which you want the genome region of interest.
       config=NULL, ##<< GLOBAL config variable
       big_cur=NULL ##<< A larger region than roi, used to filter c2c if it is needed.
       ) {
         # Signed number of positions spanned from begin to end; a single-position
         # region counts as 1, whichever path computes it.
         signed_length = function(begin, end) {
           direction = sign(end - begin)
           if (direction == 0) {
             return(1)
           }
           end - begin + direction * 1
         }
         strain1 = roi$strain_ref
         if (strain1 == strain2) {
           # Nothing to translate, only the length is (re)computed.
           roi$length = signed_length(roi$begin, roi$end)
           return(roi)
         }
         # Extract c2c file
         if (!is.null(big_cur)) {
           # Dealing with big_cur: it must be expressed in the same ref as roi, with begin <= end.
           if (roi$strain_ref != big_cur$strain_ref) {
             big_cur = translate_cur(big_cur, roi$strain_ref, config=config)
           }
           if (big_cur$end < big_cur$begin) {
             tmp_var = big_cur$begin
             big_cur$begin = big_cur$end
             big_cur$end = tmp_var
             big_cur$length = big_cur$end - big_cur$begin + 1
           }
           if (big_cur$chr!=roi$chr | roi$end > big_cur$end | roi$end < big_cur$begin | roi$begin > big_cur$end | roi$begin < big_cur$begin) {
             print("WARNING! Trying to translate a roi not included in a big_cur.")
             return(NULL)
           }
           c2c = c2c_extraction(strain1, strain2, big_cur$chr, big_cur$begin, big_cur$end, config=config)
         } else {
           # No big_cur
           c2c = c2c_extraction(strain1, strain2, roi$chr, config=config)
         }
         reverse = (strain1=="RM" & strain2=="BY") | strain1=="YJM"
         # Rows of c2c whose [V2, V3] interval contains pos. For reversed tables the
         # interval orientation depends on the V8 column (1 or -1).
         rows_covering = function(pos) {
           if (reverse) {
             c2c[(c2c$V3>=pos & c2c$V2<=pos & c2c$V8==1) | (c2c$V2>=pos & c2c$V3<=pos & c2c$V8==-1),]
           } else {
             c2c[c2c$V3>=pos & c2c$V2<=pos,]
           }
         }
         begin_1 = roi$begin
         end_1 = roi$end
         tmptransfostart = rows_covering(begin_1)
         tmptransfostop = rows_covering(end_1)
         # Never happend conditions ...
         if (length(tmptransfostart$V8) == 0) {
           # begin_1 is between two lines: shift begin_1 to the start of 2nd line.
           if (sum(c2c$V3 >= c2c$V2) != 0) {
             tmp_c2c = c2c[c2c$V2>=begin_1,]
             begin_1 = min(tmp_c2c$V2)
           } else {
             tmp_c2c = c2c[c2c$V3>=begin_1,]
             begin_1 = min(tmp_c2c$V3)
           }
           tmptransfostart = rows_covering(begin_1)
           if (length(tmptransfostart$V8) == 0) {
             if (!is.null(big_cur)) {
               return(NULL)
             } else {
               print(tmptransfostart)
               print(tmptransfostop)
               stop("Never happend condition 1.")
             }
           }
         }
         if (length(tmptransfostop$V8) == 0) {
           # end_1 is between two lines: shift end_1 to the end of the previous line.
           if (sum(c2c$V3 >= c2c$V2) != 0) {
             tmp_c2c = c2c[c2c$V3<=end_1,]
             end_1 = max(tmp_c2c$V3)
           } else {
             tmp_c2c = c2c[c2c$V2<=end_1,]
             end_1 = max(tmp_c2c$V2)
           }
           tmptransfostop = rows_covering(end_1)
           if (length(tmptransfostop$V8) == 0) {
             if (!is.null(big_cur)) {
               return(NULL)
             } else {
               print(tmptransfostart)
               print(tmptransfostop)
               stop("Never happend condition 2.")
             }
           }
         }
         if (length(tmptransfostart$V8) != 1) {
           # Many candidate rows for the start: keep the one that begins exactly at begin_1.
           tmptransfostart = tmptransfostart[tmptransfostart$V3>=begin_1 & tmptransfostart$V2==begin_1,]
           if (length(tmptransfostart$V8) != 1) {
             print(tmptransfostart)
             print(tmptransfostop)
             stop("Never happend condition 3.")
           }
         }
         if (length(tmptransfostop$V8) != 1) {
           # Many candidate rows for the stop: keep the one that ends exactly at end_1.
           tmptransfostop = tmptransfostop[tmptransfostop$V3==end_1 & tmptransfostop$V2<=end_1,]
           if (length(tmptransfostop$V8) != 1) {
             print(tmptransfostart)
             print(tmptransfostop)
             stop("Never happend condition 4.")
           }
         }
         if (tmptransfostart$V7 != tmptransfostop$V7) {
           print(tmptransfostart)
           print(tmptransfostop)
           stop("Problem with genome region of interest of strain 1. \nIt is translated over many contigs into strain 2 ref. \nSorry, but you have to redefine your region of interest.")
         }
         # Deal with strand
         if (tmptransfostart$V8 == 1) {
           begin_2 = tmptransfostart$V9 + (begin_1 - tmptransfostart$V2)
           end_2 = tmptransfostop$V9 + (end_1 - tmptransfostop$V2)
         } else {
           begin_2 = tmptransfostart$V9 - (begin_1 - tmptransfostart$V2)
           end_2 = tmptransfostop$V9 - (end_1 - tmptransfostop$V2)
         }
         # Build returned roi
         roi$strain_ref = strain2
         if (roi$strain_ref == "BY") {
           roi$chr = ROM2ARAB()[[substr(tmptransfostart$V7, 4, 12)]]
         } else {
           roi$chr = config$FASTA_INDEXES[[strain2]][[tmptransfostart$V7]]
         }
         roi$begin = begin_2
         roi$end = end_2
         roi$length = signed_length(roi$begin, roi$end)
         return(roi)
       ### The roi with strain_ref, chr, begin, end and length expressed in strain2, or NULL when a big_cur is given and the roi is not included in it or cannot be located in the filtered c2c.
       }, ex=function(){
       	# Define new translate_cur function...
       	translate_cur = function(roi, strain2, config) {
       		strain1 = roi$strain_ref
       		if (strain1 == strain2) {
       			return(roi)
       		} else {
       		  stop("Here is my new translate_cur function...")
       		}
       	}
       	# Binding it by uncommenting the following lines.
       	# unlockBinding("translate_cur", as.environment("package:nm"))
       	# unlockBinding("translate_cur", getNamespace("nm"))
       	# assign("translate_cur", translate_cur, "package:nm")
       	# assign("translate_cur", translate_cur, getNamespace("nm"))
       	# lockBinding("translate_cur", getNamespace("nm"))
       	# lockBinding("translate_cur", as.environment("package:nm"))
       })
       compute_inter_all_strain_curs = function (# Compute Common Uninterrupted Regions (CUR)
       ### CURs are regions that can be aligned between the genomes
       diff_allowed = 30, ##<< the maximum indel width allowe din a CUR
       min_cur_width = 4000, ##<< The minimum width of a CUR
       config = NULL ##<< GLOBAL config variable
       ) {
         check_overlaping = function(strain1, strain2, chr, lower_bound, upper_bound, config=NULL) {
           c2c = c2c_extraction(strain1, strain2, chr, lower_bound, upper_bound, config=config)
           check_homogeneity(c2c)
         	if (length(c2c[,1]) == 0 ) {
             stop("WARNING! checking overlapping for a region corresponding to an empty c2c.")
           } else {
         		lower_bounds = apply(t(1:nrow(c2c)), 2,function(i){l = c2c[i,]; min(l$V2, l$V3)})
         		upper_bounds = apply(t(1:nrow(c2c)), 2,function(i){l = c2c[i,]; max(l$V2, l$V3)})
         		tmp_index = order(lower_bounds)
             lower_bounds = lower_bounds[tmp_index]
             upper_bounds = upper_bounds[tmp_index]
             tmp_diff = lower_bounds[-1] - upper_bounds[-length(upper_bounds)]
             ov_index = which(tmp_diff < 0)
             if(length(ov_index < 0) !=0 ) {
               ov_index = ov_index[1]
               print(paste("WARNING! Overlaping", " (", strain1, ",", strain2, ") chr: ", c2c[1,]$V1, sep=""))
               c2c_corrupted = c2c[tmp_index,][c(ov_index, ov_index + 1),]
               print(c2c_corrupted)
               return(list(lower_bounds[ov_index+1] - 1, upper_bounds[ov_index] + 1))
+            }
             return(NULL)
+          }
+        }
         check_homogeneity = function(sub_c2c) {
           tmp_signs = sign(sub_c2c$V2 - sub_c2c$V3)
           tmp_signs = tmp_signs[tmp_signs != 0]
         	if (sum(tmp_signs[1]  != tmp_signs)) {
         		print(paste("*************** ERROR, non homogenous region (sign)! ********************"))
             print(tmp_signs)
+        	}
           tmp_signs2 = sign(sub_c2c$V9 - sub_c2c$V10)
           tmp_signs2 = tmp_signs2[tmp_signs2 != 0]
         	if (sum(tmp_signs2[1]  != tmp_signs2)) {
         		print(paste("*************** ERROR, non homogenous region (sign2)! ********************"))
             print(tmp_signs2)
+        	}
         	if (length(unique(sub_c2c[,c(1,7,8)])[,2]) != 1) {
         		print("*************** ERROR, non homogenous region chrs or V8! ********************")
+        	}
+        }
         test_and_squeeze_rois = function(foo, config=NULL) {
           is_it_ok = function(list1, list2) {
             bar = cbind(list1$begin, list2$begin, abs(list1$begin - list2$begin), list1$end, list2$end, abs(list1$end - list2$end), list1$length, list2$length, abs(list1$length - list2$length))
             ok = length(bar[bar[,3] != 0 | bar[,6] != 0, ]) == 0
             if (!ok) {
               print(bar[bar[,3] != 0 | bar[,6] != 0, ])
+            }
             return (ok)
+          }
           squeeze_rois = function(list1, list2) {
             rois = apply(t(1:nrow(list1)), 2, function(i){
               roi = list1[i,]
               roi2 = list2[i,]
               roi$begin = max(roi$begin, roi2$begin)
               roi$end = min(roi$end, roi2$end)
               roi$length =  roi$end - roi$begin + 1
               return(roi)
             })
             return(do.call(rbind, rois))
+          }
           # foo_orig = compute_inter_all_strain_curs2(config=config)
           # foo = foo_orig
           STOP = FALSE
           nb_round = 0
           while(!STOP) {
             nb_round = nb_round + 1
             print(paste("2-2 round #", nb_round, sep=""))
             fooby = translate_curs(foo, "BY", config=config)
             fooyjm = translate_curs(foo, "YJM", config=config)
             fooyjmby = translate_curs(fooyjm, "BY", config=config)
             if (!is_it_ok(fooby, fooyjmby)) {
               print("case 1")
               foo = squeeze_rois(fooby, fooyjmby)
           		next
+            }
             foorm = translate_curs(foo, "RM", config=config)
             foormby = translate_curs(foorm, "BY", config=config)
             if (!is_it_ok(fooby, foormby)) {
               print("case 2")
               foo = squeeze_rois(fooby, foormby)
           		next
+            }
             fooyjmrm = translate_curs(fooyjm, "RM", config=config)
             fooyjmrmyjm = translate_curs(fooyjmrm, "YJM", config=config)
             if (!is_it_ok(fooyjm, fooyjmrmyjm)) {
               print("case 3")
               foo = squeeze_rois(fooyjm, fooyjmrmyjm)
               next
+            }
             foormyjm = translate_curs(foorm, "YJM", config=config)
             foormyjmrm = translate_curs(foormyjm, "RM", config=config)
             if (!is_it_ok(foorm, foormyjmrm)) {
               print("case 4")
               foo = squeeze_rois(foorm, foormyjmrm)
               next
+            }
             foo = translate_curs(foo, "BY", config=config)
             STOP = TRUE
+          }
           STOP = FALSE
           nb_round = 0
           while(!STOP) {
             nb_round = nb_round + 1
             print(paste("3-3 round #", nb_round, sep=""))
             fooby = translate_curs(foo, "BY", config=config)
             foobyrm = translate_curs(fooby, "RM", config=config)
             foobyrmyjm = translate_curs(foobyrm, "YJM", config=config)
             foobyrmyjmby = translate_curs(foobyrmyjm, "BY", config=config)
             if (!is_it_ok(fooby, foobyrmyjmby)) {
               print("case 1")
               foo = squeeze_rois(fooby, foobyrmyjmby)
+            }
             fooby = translate_curs(foo, "BY", config=config)
             foobyyjm = translate_curs(fooby, "YJM", config=config)
             foobyyjmrm = translate_curs(foobyyjm, "RM", config=config)
             foobyyjmrmby = translate_curs(foobyyjmrm, "BY", config=config)
             if (!is_it_ok(fooby, foobyyjmrmby)) {
               print("case 2")
               foo = squeeze_rois(fooby, foobyyjmrmby)
               next
+            }
             foo = translate_curs(foo, "BY", config=config)
             STOP = TRUE
+          }
           print("end")
           return(foo)
+        }
         get_inter_strain_rois = function(strain1, strain2, diff_allowed = 30, min_cur_width = 200, config=NULL) {
           c2c = c2c_extraction(strain1, strain2, config=config)
           # computing diffs
           diff = c2c$V2[-1] - c2c$V3[-length(c2c$V2)]
           diff2 = c2c$V9[-1] - c2c$V10[-length(c2c$V2)]
           # Filtering
         	indexes_stop = which(abs(diff) > diff_allowed | abs(diff2) > diff_allowed)
         	indexes_start = c(1, indexes_stop[-length(indexes_stop)] + rep(1, length(indexes_stop) -1))
           rois = apply(t(1:length(indexes_start)), 2, function(i) {
             if ( i %% 20 == 1) print(paste(i, "/", length(indexes_start)))
             returned_rois = NULL
         		start = indexes_start[i]
         		stop = indexes_stop[i]
         		sub_c2c = c2c[start:stop,]
             check_homogeneity(sub_c2c)
         		if (strain1 == "BY") {
         			chr = ROM2ARAB()[[substr(sub_c2c[1,]$V1,4,10)]]
         		} else {
         			chr = config$FASTA_INDEXES[[strain1]][[sub_c2c[1,]$V1]]
+        		}
         		roi = list(chr=chr, begin=min(c(sub_c2c$V2,sub_c2c$V3)), end=max(c(sub_c2c$V2,sub_c2c$V3)), strain_ref=strain1)
         		roi$length = roi$end - roi$begin + 1
         		if (roi$length >= min_cur_width) {
         			lower_bound = roi$begin
         			upper_bound = roi$end
               check = check_overlaping(strain1, strain2, chr, lower_bound, upper_bound, config=config)
               while(!is.null(check)) {
                 # print(check)
             		roi1 = roi
                 roi1$end = check[[1]]
             		roi1$length = roi1$end - roi1$begin + 1
             		if (roi1$length >= min_cur_width) {
                   returned_rois = dfadd(returned_rois,roi1)
+                }
                 roi$begin = check[[2]]
             		roi$length = roi$end - roi$begin + 1
             		if (roi$length >= min_cur_width) {
             			lower_bound = min(roi$begin, roi$end)
             			upper_bound = max(roi$begin, roi$end)
                   check = check_overlaping(strain1, strain2, chr, lower_bound, upper_bound, config=config)
                 } else {
                   check = NULL
                   roi = NULL
+                }
+              }
               returned_rois = dfadd(returned_rois,roi)
+        	  }
           })
           rois = do.call(rbind,rois)
           rois = rois[order(as.numeric(rois$chr), rois$begin), ]
         	return(rois)
+        }
         translate_curs = function(rois, target_strain, config) {
           tr_rois = apply(t(1:nrow(rois)), 2, function(i){
             roi = rois[i,]
             tr_roi = translate_cur(roi, target_strain, config=config)
             tmp_begin = min(tr_roi$begin, tr_roi$end)
             tmp_end = max(tr_roi$begin, tr_roi$end)
             tr_roi$begin = tmp_begin
             tr_roi$end = tmp_end
             tr_roi$length =  tr_roi$end - tr_roi$begin + 1
             return(tr_roi)
           })
           tr_rois = do.call(rbind, tr_rois)
           return(tr_rois)
+        }
         combis = list(c("BY", "RM"), c("BY", "YJM"), c("RM", "YJM"))
         rois = list()
         for (combi in combis) {
           strain1 = combi[1]
           strain2 = combi[2]
           print(paste(strain1, strain2))
           rois_fwd = get_inter_strain_rois(strain1, strain2, min_cur_width = min_cur_width, diff_allowed = diff_allowed, config=config)
           strain1 = combi[2]
           strain2 = combi[1]
           print(paste(strain1, strain2))
           rois_rev = get_inter_strain_rois(strain1, strain2, min_cur_width = min_cur_width, diff_allowed = diff_allowed, config=config)
           tr_rois_rev = translate_curs(rois_rev, combi[1], config)
           region1 = rois_fwd
           region2 = tr_rois_rev
           rois[[paste(combi[1], combi[2], sep="_")]] = intersect_region(rois_fwd, tr_rois_rev)
+        }
         reducted_1_rois = intersect_region(rois[["BY_RM"]], rois[["BY_YJM"]])
         reducted_1_rois = reducted_1_rois[reducted_1_rois$length >= min_cur_width, ]
         tr_reducted_1_rois = translate_curs(reducted_1_rois, "RM", config)
         reducted_2_rois = intersect_region(tr_reducted_1_rois, rois[["RM_YJM"]])
         reducted_2_rois = reducted_2_rois[reducted_2_rois$length >= min_cur_width, ]
         reducted_rois = translate_curs(reducted_2_rois, "BY", config)
         reducted_rois = reducted_rois[order(as.numeric(reducted_rois$chr), reducted_rois$begin), ]
         squeezed_rois = test_and_squeeze_rois(reducted_rois, config=config)
         return (squeezed_rois)
+      }
       intersect_region = function(# Returns the intersection of 2 lists of regions.
       ### Clips every region of region1 to the region(s) of region2 that it overlaps on the same chromosome. A region of region1 that overlaps nothing in region2 is dropped; a region that overlaps several regions of region2 yields one clipped row per overlap.
       region1, ##<< Original regions (uses the chr, begin, end and length columns).
       region2 ##<< Regions to intersect (uses the chr, begin and end columns).
       ) {
         # Nothing to intersect. NULL is also what this function returns when
         # every region has been removed, so chained calls must accept it.
         if (is.null(region1) || is.null(region2) || isTRUE(nrow(region1) == 0)) {
           return(NULL)
         }
         # Shrink roi1 so that it does not extend beyond the single region roi2.
         clip_region = function(roi1, roi2) {
           if (roi1$begin < roi2$begin) {
             print("not the same begin")
             roi1$begin = roi2$begin
             roi1$length =  roi1$end - roi1$begin + 1
           }
           if (roi1$end > roi2$end) {
             print("not the same end")
             roi1$end = roi2$end
             roi1$length =  roi1$end - roi1$begin + 1
           }
           return(roi1)
         }
         # seq_len() instead of 1:nrow(): no bogus c(1, 0) iteration on empty input.
         intersection = lapply(seq_len(nrow(region1)), function(i) {
           roi1 = region1[i, ]
           sub_regions2 = region2[region2$chr == roi1$chr, ]
           # A candidate overlaps roi1 when it starts inside roi1, ends inside
           # roi1, or strictly contains roi1.
           overlapping = roi1$begin <= sub_regions2$begin & sub_regions2$begin <= roi1$end |
                         roi1$begin <= sub_regions2$end & sub_regions2$end <= roi1$end |
                         sub_regions2$begin < roi1$begin  & roi1$end < sub_regions2$end
           sub_regions2 = sub_regions2[overlapping, ]
           if (nrow(sub_regions2) == 0) {
             print("removing a region")
             return(NULL)
           }
           if (nrow(sub_regions2) == 1) {
             return(clip_region(roi1, sub_regions2[1, ]))
           }
           print("more than one region in intersect_region")
           # One clipped copy of roi1 per overlapping region.
           pieces = lapply(seq_len(nrow(sub_regions2)), function(j) {
             clip_region(roi1, sub_regions2[j, ])
           })
           return(do.call(rbind, pieces))
         })
         return(do.call(rbind, intersection))
       ### Returns the clipped regions (rows of region1), or NULL when nothing is left.
       }
       build_replicates = structure(function(# Stage replicates data
       ### This function loads in memory data corresponding to the given experiments.
       expe, ##<< a list of vectors of sample ids, one vector per replicate.
       roi, ##<< the region that we are interested in.
       only_fetch=FALSE, ##<< if TRUE, inputs (and outputs) are only loaded; if FALSE, they are also filtered on the translated roi.
       get_genome=FALSE,##<< Load or not corresponding genome.
       all_samples, ##<< Global list of samples.
       config=NULL ##<< GLOBAL config variable.
       ) {
         # Build the list of samples of one replicate from their ids.
         # `config` is taken from the enclosing call.
         build_samples = function(samples_ids, roi, only_fetch=FALSE, get_genome=TRUE, get_outputs=TRUE, all_samples) {
           samples = lapply(samples_ids, function(i) {
             sample = as.list(all_samples[all_samples$id==i,])
             sample$orig_roi = roi
             sample$roi = translate_cur(roi, sample$strain, config = config)
             if (get_genome) {
               # Get Genome: sequence of the translated roi on its chromosome.
               fasta_ref_filename = config$FASTA_REFERENCE_GENOME_FILES[[sample$strain]]
               genome = get_content(fasta_ref_filename, "fasta")
               chr_name = switch_pairlist(config$FASTA_INDEXES[[sample$strain]])[[sample$roi$chr]]
               sample$roi$genome = genome[[chr_name]][sample$roi$begin:sample$roi$end]
             }
             # The filters below always receive ordered bounds, whatever the
             # relative order of begin and end in the translated roi.
             roi_lower = min(sample$roi$begin, sample$roi$end)
             roi_upper = max(sample$roi$begin, sample$roi$end)
             # Get inputs
             sample_inputs_filename = paste(config$ALIGN_DIR, "/TF/sample_", i, "_TF.txt", sep="")
             sample$inputs = get_content(sample_inputs_filename, "table", stringsAsFactors=FALSE)
             # Total is computed on the unfiltered inputs.
             sample$total_reads = sum(sample$inputs[,4])
             if (!only_fetch) {
               # NOTE(review): 300 is presumably the nucleosome width expected by the filter - confirm against filter_tf_inputs.
               sample$inputs = filter_tf_inputs(sample$inputs, sample$roi$chr, roi_lower, roi_upper, 300, filter_for_coverage=TRUE)
             }
             # Get TF outputs for Mnase_Seq samples
             if (sample$marker == "Mnase_Seq" && get_outputs) {
               sample_outputs_filename = paste(config$ALIGN_DIR, "/TF/sample_", i, "_all_nucs.tab", sep="")
               sample$outputs = get_content(sample_outputs_filename, "table", header=TRUE, sep="\t")
               if (!only_fetch) {
                 sample$outputs = filter_tf_outputs(sample$outputs, sample$roi$chr, roi_lower, roi_upper, 300)
               }
             }
             return(sample)
           })
           # Positional list, even when samples_ids carries names.
           return(unname(samples))
         }
         replicates = lapply(expe, function(samples_ids) {
           build_samples(samples_ids, roi, only_fetch=only_fetch, get_genome=get_genome, all_samples=all_samples)
         })
         return(unname(replicates))
       ### Returns a list with one element per replicate, each being the list of its staged samples.
       }, ex = function() {
         # library(rjson)
         # library(nucleominer)
         #
         # # Read config file
         # json_conf_file = "nucleo_miner_config.json"
         # config = fromJSON(paste(readLines(json_conf_file), collapse=""))
         # # Read sample file
         # all_samples = get_content(config$CSV_SAMPLE_FILE, "cvs", sep=";", head=TRUE, stringsAsFactors=FALSE)
         # # here are the sample ids in a list
         # expes = list(c(1))
         # # here is the region for which we want to see the coverage
         # cur = list(chr="8", begin=472000, end=474000, strain_ref="BY")
         # # it displays the coverage
         # replicates = build_replicates(expes, cur, all_samples=all_samples, config=config)
         # out = watch_samples(replicates, config$READ_LENGTH,
         #       plot_coverage = TRUE,
         #       plot_squared_reads = FALSE,
         #       plot_ref_genome = FALSE,
         #       plot_arrow_raw_reads = FALSE,
         #       plot_arrow_nuc_reads = FALSE,
         #       plot_gaussian_reads = FALSE,
         #       plot_gaussian_unified_reads = FALSE,
         #       plot_ellipse_nucs = FALSE,
         #       plot_wp_nucs = FALSE,
         #       plot_wp_nuc_model = FALSE,
         #       plot_common_nucs = FALSE,
         #       height = 50)
       })
       watch_samples = function(# Watching analysis of samples
       ### This function allows to view analysis for a particular region of the genome. Every sample is drawn in its own horizontal band of `height` units; the bands of a replicate are stacked and replicates are stacked on top of each other.
       replicates, ##<< list of replicates, each replicate being a non-empty list of samples (with the fields id, strain, marker, roi, inputs, total_reads and, for Mnase_Seq samples, outputs).
       read_length, ##<< length of the reads
       plot_ref_genome = TRUE, ##<< Plot (or not) reference genome.
       plot_arrow_raw_reads = TRUE,  ##<< Plot (or not) arrows for raw reads.
       plot_arrow_nuc_reads = TRUE,  ##<< Plot (or not) arrows for reads associated to a nucleosome.
       plot_squared_reads = TRUE,  ##<< Plot (or not) reads in the square fashion.
       plot_coverage = FALSE,  ##<< Plot (or not) reads in the coverage fashion.
       plot_gaussian_reads = TRUE,  ##<< Plot (or not) gaussian model of F and R reads.
       plot_gaussian_unified_reads = TRUE,  ##<< Plot (or not) gaussian model of a nuc.
       plot_ellipse_nucs = TRUE,  ##<< Plot (or not) ellipse for a nuc.
       change_col = TRUE, ##<< Change the color of each nucleosome.
       plot_wp_nucs = TRUE,  ##<< Plot (or not) cluster of nucs
       plot_fuzzy_nucs = TRUE,  ##<< Plot (or not) cluster of fuzzy
       plot_wp_nuc_model = TRUE,  ##<< Plot (or not) gaussian model for a cluster of nucs
       plot_common_nucs = FALSE,  ##<< Plot (or not) aligned reads.
       plot_common_unrs = FALSE,  ##<< Plot (or not) unaligned nucleosomal regions (UNRs). Only considered when plot_common_nucs is TRUE.
       plot_wp_nucs_4_nonmnase = FALSE,  ##<< Plot (or not) clusters for non inputs samples.
       plot_chain = FALSE,  ##<< Plot (or not) clusterised nucleosomes between mnase samples.
       plot_sample_id = FALSE, ##<<  Plot (or not) the sample id for each sample.
       aggregated_intra_strain_nucs = NULL, ##<< list of aggregated intra strain nucs. If NULL, it will be computed.
       aligned_inter_strain_nucs = NULL, ##<< list of aligned inter strain nucs. If NULL, it will be computed.
       height = 10, ##<< Number of reads per million reads for each sample, graphical parameter for the y axis.
       main=NULL, ##<< main title of the produced plot
       xlab=NULL, ##<< xlab of the produced plot
       ylab="#reads (per million reads)", ##<< ylab of the produced plot
       config=NULL ##<< GLOBAL config variable
       ){
         # The display parameters come from the first sample of the first
         # replicate and each replicate is drawn from its own samples, so an
         # empty replicate cannot be displayed.
         nb_samples = vapply(replicates, length, integer(1))
         if (length(replicates) == 0 || any(nb_samples == 0)) {
           stop("watch_samples needs at least one replicate and at least one sample per replicate.")
         }
         returned_list = list()
         # Computing global display parameters
         # A roi with begin >= end is displayed on negated coordinates.
         first_roi = replicates[[1]][[1]]$roi
         if (first_roi[["begin"]] < first_roi[["end"]]) {
           x_min_glo = first_roi[["begin"]]
           x_max_glo = first_roi[["end"]]
         } else {
           x_min_glo = - first_roi[["begin"]]
           x_max_glo = - first_roi[["end"]]
         }
         base_glo = 0
         nb_rank_glo = sum(nb_samples)
         # Lower y bound of each replicate: one band of `height` for every sample
         # of the preceding replicates (replicates may differ in size).
         replicate_bases = base_glo + height * (cumsum(nb_samples) - nb_samples)
         ylim_glo = c(base_glo, base_glo + height * nb_rank_glo)
         y_min_glo = min(ylim_glo)
         y_max_glo = max(ylim_glo)
         delta_y_glo = y_max_glo - y_min_glo
         # Plot main frame
         if (is.null(xlab)) {
           xlab = paste("Ref strain:", replicates[[1]][[1]]$strain, "chr: ", replicates[[1]][[1]]$roi$chr)
         }
         plot(c(x_min_glo,x_max_glo), c(0,0), ylim=ylim_glo, col=0, yaxt="n", ylab=ylab, xlab=xlab, main=main )
         axis(2, at=0:(nb_rank_glo*2) * delta_y_glo / (nb_rank_glo*2), labels=c(rep(c(height/2,0),nb_rank_glo),height/2))
         # Go
         replicates_wp_nucs = list()
         wp_maps = list()
         fuzzy_maps = list()
         for (replicate_rank in seq_along(replicates)) {
           # Computing replicate parameters (from the samples of THIS replicate)
           samples = replicates[[replicate_rank]]
           nb_rank = length(samples)
           base = replicate_bases[[replicate_rank]]
           ylim = c(base, base + height * nb_rank)
           y_min = min(ylim)
           y_max = max(ylim)
           delta_y = y_max - y_min
           for (sample_rank in seq_along(samples)) {
             # computing sample parameters
             sample = samples[[sample_rank]]
             # Middle of the band of this sample.
             y_lev = y_min + (sample_rank - 0.5) * delta_y/nb_rank
             if (plot_sample_id) {
               text(x_min_glo, y_lev + height/2 - delta_y_glo/100, labels=paste("(",sample$id,") ",sample$strain, " ", sample$marker, sep=""))
             }
             if (sample$roi[["begin"]] < sample$roi[["end"]]) {
               x_min = sample$roi[["begin"]]
               x_max = sample$roi[["end"]]
             } else {
               x_min = - sample$roi[["begin"]]
               x_max = - sample$roi[["end"]]
             }
             # Translation that aligns this sample on the first sample of the plot.
             shift = x_min_glo - x_min
             # -1 when the sample is displayed on negated coordinates.
             orient = sign(x_min)
             # Plot Genome seq
             if (plot_ref_genome) {
               text(seq_along(sample$roi$genome) + x_min - 1 + shift, rep(y_lev - height/2, length(sample$roi$genome)), labels=toupper(sample$roi$genome), cex=dev.size()[1]*9/(x_max-x_min), family="Courier")
             }
             # Plot reads
             reads = sample$inputs
             signs = sign_from_strand(reads[,3])
             if (plot_arrow_raw_reads) {
               read_y = orient * signs * reads[,4] * 1000000/sample$total_reads + y_lev
               arrows(orient * reads[,2] + shift, read_y, orient * (reads[,2] + signs * read_length) + shift, read_y,
               col=1, length=0.15/nb_rank)
             }
             if (plot_squared_reads) {
               # require(plotrix)
               rect(orient * reads[,2] + shift, rep(y_lev,length(reads[,1])), orient * (reads[,2] + signs * read_length) + shift,  y_lev + orient * signs * reads[,4] * 1000000/sample$total_reads, col=adjustcolor(1, alpha.f = 0.1),border=0)
             }
             if (plot_coverage) {
               if (length(reads[,1]) != 0) {
                 step_h = orient * signs * reads[,4]
                 step_b = orient * reads[,2] + shift
                 # NOTE(review): reads are extended by a hard-coded 150 here, not by read_length - confirm this is intended.
                 step_e = orient * (reads[,2] + signs * 150) + shift
                 steps_x = min(step_b, step_e):max(step_b, step_e)
                 steps_y = rep(0, length(steps_x))
                 # Each read adds its count where it starts and removes it where it ends.
                 for (i in seq_along(step_h)) {
                   i_up = which(steps_x==min(step_b[i], step_e[i]))
                   steps_y[i_up] = steps_y[i_up] + abs(step_h[i])
                   i_down = which(steps_x==max(step_b[i], step_e[i]))
                   steps_y[i_down] = steps_y[i_down] - abs(step_h[i])
                 }
                 # Keep the positions where the level changes, then accumulate the
                 # changes to get the coverage level after each position.
                 tmp_index = which(steps_y != 0)
                 steps_x = steps_x[tmp_index]
                 steps_y = cumsum(steps_y[tmp_index])
                 steps_y = c(0, steps_y)
                 steps_y = steps_y * 1000000/sample$total_reads
               } else {
                 steps_y = c(0, 0, 0)
                 steps_x = c(x_min, x_max)
               }
               # print(steps_x)
               # print(steps_y)
               lines(stepfun(steps_x, steps_y + y_lev), pch="")
               abline(y_lev,0)
               returned_list[[paste("cov", sample$id, sep="_")]] = stepfun(steps_x, steps_y)
             }
             # Plot nucs
             # NOTE(review): plot_ellipse_nucs alone does not enter this block, while plot_squared_reads (unused inside) does - confirm the intended condition.
             if (sample$marker == "Mnase_Seq" && (plot_squared_reads || plot_gaussian_reads || plot_gaussian_unified_reads || plot_arrow_nuc_reads)) {
               nucs = sample$outputs
               if (length(nucs$center) > 0) {
                 col = 1
                 for (i in seq_along(nucs$center)) {
                   if (change_col) {
                     col = col + 1
                   } else {
                     col = "blue"
                   }
                   nuc = nucs[i,]
                   involved_reads = filter_tf_inputs(reads, sample$roi$chr, nuc$lower_bound, nuc$upper_bound, nuc_width = nuc$width)
                   involved_signs = ifelse(involved_reads[,3] == "F", 1, -1)
                   total_involved_reads = sum(involved_reads[,4])
                   if (plot_arrow_nuc_reads) {
                     involved_y = orient * involved_signs * involved_reads[,4] * 1000000/sample$total_reads + y_lev
                     arrows(orient * involved_reads[,2] + shift, involved_y, orient * (involved_reads[,2] + involved_signs * read_length) + shift, involved_y,
                     col=col, length=0.15/nb_rank)
                   }
                   # Shared by the two gaussian displays, computed once.
                   if (plot_gaussian_reads || plot_gaussian_unified_reads) {
                     flatted_reads = flat_reads(involved_reads, nuc$width)
                     delta_x = (nuc$center - nuc$width):(nuc$center + nuc$width)
                   }
                   if (plot_gaussian_reads) {
                     lines(orient * delta_x + shift, dnorm(delta_x, mean(flatted_reads[[1]]), sd(flatted_reads[[1]])) * length(flatted_reads[[1]]) * orient * height/5 + y_lev, col=col)
                     lines(orient * delta_x + shift, dnorm(delta_x, mean(flatted_reads[[2]]), sd(flatted_reads[[2]])) * length(flatted_reads[[2]]) * -1 * orient * height/5 + y_lev, col=col)
                   }
                   if (plot_gaussian_unified_reads) {
                     lines(orient * delta_x + shift, dnorm(delta_x, mean(flatted_reads[[3]]), sd(flatted_reads[[3]])) * length(flatted_reads[[3]]) * height/5 + y_lev, col=col, lty=1)
                   }
                   if (plot_ellipse_nucs) {
                     # require(plotrix)
                     draw.ellipse(orient * nuc$center + shift, y_lev, nuc$width/2, total_involved_reads/nuc$width * height/5, border=col)
                   }
                 }
               } else {
                 print("WARNING! No nucs to print.")
               }
             }
           }
           # Plot wp nucs
           # From here `sample`, `x_min` and `shift` are those of the last sample of the replicate.
           if ((plot_wp_nucs_4_nonmnase || sample$marker == "Mnase_Seq") && (plot_wp_nucs || plot_fuzzy_nucs || plot_common_nucs || plot_chain)) {
             if (samples[[1]]$marker == "Mnase_Seq") {
               if (is.null(aggregated_intra_strain_nucs)) {
                 wp_nucs = aggregate_intra_strain_nucs(samples)[[1]]
               } else {
                 wp_nucs = aggregated_intra_strain_nucs[[replicate_rank]]
               }
             } else {
               # NOTE(review): reuses the wp nucs stored two replicates earlier; presumably relies on a fixed ordering of the replicates - confirm with callers.
               wp_nucs = replicates_wp_nucs[[replicate_rank-2]]
             }
             if (plot_chain) {
               # One row per template_filter nucleosome of every aggregated nuc.
               tf_nucs = lapply(wp_nucs, function(nuc) {
                 bar = apply(t(nuc$nucs), 2, function(tmp_nuc){
                   tmp_nuc = tmp_nuc[[1]]
                   tmp_nuc$inputs = NULL
                   tmp_nuc$original_reads = NULL
                   tmp_nuc$wp = nuc$wp
                   # print(tmp_nuc)
                   return(tmp_nuc)
                 })
                 return(do.call(rbind, bar))
               })
               tf_nucs = data.frame(do.call(rbind, tf_nucs))
               tmp_x = (unlist(tf_nucs$lower_bound) + unlist(tf_nucs$upper_bound)) / 2
               if (length(tmp_x) > 0) {
                 tmp_y =  y_min + (unlist(tf_nucs$track) - 0.5) * delta_y/nb_rank
                 tmp_y_prev = tmp_y[-length(tmp_y)]
                 tmp_y_next = tmp_y[-1]
                 tmp_y_inter = (tmp_y_prev + tmp_y_next) / 2
                 tmp_track = unlist(tf_nucs$track)
                 tmp_track_prev = tmp_track[-length(tmp_track)]
                 tmp_track_next = tmp_track[-1]
                 # tmp_track_inter = signif(tmp_track_prev - tmp_track_next) * (abs(tmp_track_prev - tmp_track_next) > 1) * 25
                 # Default kept in a local so that the caller's config is not altered.
                 track_lod_offset = config$TRACK_LOD_OFFSET
                 if (is.null(track_lod_offset)) {
                   track_lod_offset = 0
                 }
                 # NOTE(review): signif() rounds, it does not take the sign; sign() may have been intended - confirm.
                 tmp_track_inter = signif(tmp_track_prev - tmp_track_next) + track_lod_offset * 25
                 tmp_x_prev = tmp_x[-length(tmp_x)]
                 tmp_x_next = tmp_x[-1]
                 # Labels of nucleosomes closer than 50 are shifted aside.
                 need_shift = (tmp_x_next - tmp_x_prev) < 50
                 tmp_x_inter = (tmp_x_prev + tmp_x_next) / 2 + tmp_track_inter * need_shift
                 tmp_llr_inter =signif(unlist(tf_nucs$llr_score)[-1], 2)
                 # Interleave nucleosome positions (odd) and label positions (even).
                 new_tmp_x = c()
                 new_tmp_y = c()
                 index_odd = seq_along(tmp_x) * 2 - 1
                 index_even = seq_len(length(tmp_x) - 1) * 2
                 new_tmp_x[index_odd] = tmp_x
                 new_tmp_y[index_odd] = tmp_y
                 new_tmp_x[index_even] = tmp_x_inter
                 new_tmp_y[index_even] = tmp_y_inter
                 lines(new_tmp_x , new_tmp_y, lwd=2)
                 points(tmp_x, tmp_y, cex=4, pch=16, col="white")
                 points(tmp_x, tmp_y, cex=4, lwd=2)
                 text(tmp_x, tmp_y, seq_len(nrow(tf_nucs)))
                 if (is.null(config$LEGEND_LOD_POS)) {
                   pos = 2
                 } else {
                   pos = config$LEGEND_LOD_POS
                 }
                 # text() rejects zero-length labels: nothing to write for a single nucleosome.
                 if (length(tmp_x_inter) > 0) {
                   col_llr = ifelse(tmp_llr_inter < 20, "green", "red")
                   text(tmp_x_inter, tmp_y_inter, tmp_llr_inter, cex=1.5, pos=pos, col=col_llr)
                 }
               }
             }
             if (plot_wp_nucs || plot_fuzzy_nucs || plot_common_nucs ) {
               replicates_wp_nucs[[replicate_rank]] = wp_nucs
               strain = samples[[1]]$strain
               wp_maps[[strain]] = flat_aggregated_intra_strain_nucs(wp_nucs, "foo")
               fuzzy_maps[[strain]] = get_intra_strain_fuzzy(wp_maps[[strain]], as.list(samples[[1]]$roi), samples[[1]]$strain, config=config)
               if (plot_fuzzy_nucs) {
                 fuzzy_map = fuzzy_maps[[strain]]
                 if (!is.null(fuzzy_map)) {
                   if (nrow(fuzzy_map) > 0) {
                     rect(sign(x_min) * fuzzy_map$lower_bound + shift, y_min, sign(x_min) * fuzzy_map$upper_bound + shift, y_max, col=adjustcolor(3, alpha.f = 0.1), border=1)
                   }
                 }
               }
               if (plot_wp_nucs) {
                 for (wp_nuc in wp_nucs) {
                   if (wp_nuc$wp){
                     rect(sign(x_min) * wp_nuc$lower_bound + shift, y_min, sign(x_min) * wp_nuc$upper_bound + shift, y_max, col=adjustcolor(2, alpha.f = 0.1), border=1)
                     if (plot_wp_nuc_model) {
                       all_original_reads = c()
                       for(initial_nuc in wp_nuc$nucs) {
                         all_original_reads = c(all_original_reads, initial_nuc$original_reads)
                       }
                       delta_x = wp_nuc$lower_bound:wp_nuc$upper_bound
                       lines(sign(x_min) * delta_x + shift, dnorm(delta_x, mean(all_original_reads), sd(all_original_reads)) * length(all_original_reads) * height/5 + y_min, col=1)
                     }
                   }
                 }
               }
             }
           }
         }
         if (plot_common_nucs) {
           if (is.null(aligned_inter_strain_nucs)) {
             aligned_inter_strain_nucs = align_inter_strain_nucs(replicates, replicates_wp_nucs[[1]], replicates_wp_nucs[[2]], config=config)[[1]]
             if (!is.null(aligned_inter_strain_nucs)) {
               aligned_inter_strain_nucs$cur_index = "foo"
             }
           }
           #Plot common wp nucs
           # Per-replicate display parameters, indexed by replicate rank.
           mid_y = shift = x_min = x_max = y_min = y_max = list()
           for (replicate_rank in seq_along(replicates)) {
             samples = replicates[[replicate_rank]]
             replicate_ylim = c(replicate_bases[[replicate_rank]], replicate_bases[[replicate_rank]] + height * length(samples))
             y_min[[replicate_rank]] = min(replicate_ylim)
             y_max[[replicate_rank]] = max(replicate_ylim)
             mid_y[[replicate_rank]] = (y_max[[replicate_rank]] + y_min[[replicate_rank]]) / 2
             # The x parameters of a replicate are those of its last sample.
             sample = samples[[length(samples)]]
             if (sample$roi[["begin"]] < sample$roi[["end"]]) {
               x_min[[replicate_rank]] = sample$roi[["begin"]]
               x_max[[replicate_rank]] = sample$roi[["end"]]
             } else {
               x_min[[replicate_rank]] = - sample$roi[["begin"]]
               x_max[[replicate_rank]] = - sample$roi[["end"]]
             }
             shift[[replicate_rank]] = x_min[[1]] - x_min[[replicate_rank]]
           }
           print(aligned_inter_strain_nucs)
           if (!is.null(aligned_inter_strain_nucs)) {
             for (inter_strain_nuc_index in seq_len(nrow(aligned_inter_strain_nucs))) {
               inter_strain_nuc = aligned_inter_strain_nucs[inter_strain_nuc_index,]
               # One point per replicate, at the center of the nuc in its strain.
               tmp_xs = tmp_ys = c()
               for (replicate_rank in seq_along(replicates)) {
                 samples = replicates[[replicate_rank]]
                 strain = samples[[1]]$strain
                 tmp_xs = c(tmp_xs, sign(x_min[[replicate_rank]]) * (inter_strain_nuc[[paste("lower_bound_",strain,sep="")]] + inter_strain_nuc[[paste("upper_bound_",strain,sep="")]])/2 + shift[[replicate_rank]])
                 tmp_ys = c(tmp_ys, mid_y[[replicate_rank]])
               }
               lines(tmp_xs, tmp_ys, col=2, type="b", lwd=dev.size()[1]*100/(x_max[[1]]-x_min[[1]])*8, cex=dev.size()[1]*400/(x_max[[1]]-x_min[[1]]), pch=19)
             }
           }
           if (plot_common_unrs) {
             combi = c(replicates[[1]][[1]]$strain, replicates[[2]][[1]]$strain)
             # roi of the first sample of the last replicate.
             roi = as.list(replicates[[length(replicates)]][[1]]$roi)
             cur_index = "foo"
             common_nuc_results = list()
             common_nuc_results[[paste(combi[1], combi[2], sep="_")]] = aligned_inter_strain_nucs
             unrs = get_unrs(combi, roi, cur_index, wp_maps, fuzzy_maps, common_nuc_results, config = config)
             rect(sign(x_min[[1]]) * unrs$lower_bound + shift[[1]], y_min[[1]], sign(x_min[[1]]) * unrs$upper_bound + shift[[1]], y_max[[2]], border=4, lwd=10, col=adjustcolor(4, alpha.f = 0.05))
           }
         }
         return(returned_list)
       ### Returns a list holding, when plot_coverage is TRUE, one coverage step function per sample, named "cov_<sample id>" (in reads per million reads).
       }
       get_intra_strain_fuzzy = function(# Compute the fuzzy list for a given strain.
       ### This function grabs the nucleosomes detected by template_filter that have been rejected by aggregate_intra_strain_nucs as well-positioned ones. Concretely, it takes the rows of wp_map flagged wp == 0, subtracts the rows flagged wp == 1 from them with substract_region, then passes the remainder through union_regions and crop_fuzzy.
       wp_map, ##<< Well positioned nucleosomes map (must provide a wp column holding 0/1 flags).
       roi, ##<< The region of interest.
       strain, ##<< The strain we want to extract the fuzzy map for.
       config=NULL ##<< GLOBAL config variable.
       ) {
         fuzzy_map = wp_map[wp_map$wp==0, ]
         # Nothing was rejected: hand back the empty selection untouched.
         if (nrow(fuzzy_map) == 0) {
           return(fuzzy_map)
         }
         fuzzy_map = substract_region(fuzzy_map, wp_map[wp_map$wp==1,])
         # substract_region may leave nothing (NULL); in that case there is
         # nothing to merge nor to crop.
         if (is.null(fuzzy_map)) {
           return(NULL)
         }
         fuzzy_map = union_regions(fuzzy_map)
         fuzzy_map = crop_fuzzy(fuzzy_map, roi, strain, config)
         return(fuzzy_map)
       ### Returns the fuzzy map of the strain: the empty selection when wp_map holds no wp == 0 row, NULL when substract_region returns NULL, otherwise the output of crop_fuzzy.
       }
       get_unrs = function(# Compute the unaligned nucleosomal regions (UNRs).
       ### This function aggregates, for each strain of the combination, the fuzzy regions and the well-positioned (wp) nucleosomes that are not common to both strains, then subtracts the common wp nucleosomes from them. Resulting regions narrower than min_unr_width are dropped and the remaining ones are re-indexed from 1.
       combi, ##<< The strain combination to consider.
       roi, ##<< The region of interest.
       cur_index, ##<< The region of interest index.
       wp_maps, ##<< Well positioned nucleosomes maps.
       fuzzy_maps, ##<< Fuzzy nucleosomes maps.
       common_nuc_results, ##<< Common wp nuc maps
       config=NULL, ##<< GLOBAL config variable
       min_unr_width=75 ##<< Minimal width (upper_bound - lower_bound) a UNR must have to be kept.
       ) {
         tmp_combi_key = paste(combi[1], combi[2], sep="_")
         tmp_common_nucs = common_nuc_results[[tmp_combi_key]]
         tmp_common_nucs = tmp_common_nucs[tmp_common_nucs$cur_index == cur_index, ]

         # TRUE when a region table holds no region at all (NULL or zero rows).
         is_empty = function(regions) {
           is.null(regions) || nrow(regions) == 0
         }

         # wp nucleosomes of `strain` for the current region index, restricted
         # either to those listed in the common nucs (common=TRUE) or to the
         # others (common=FALSE).
         select_wp = function(strain, common) {
           strain_wp = wp_maps[[strain]]
           strain_wp = strain_wp[strain_wp$wp==1,]
           strain_wp = strain_wp[strain_wp$cur_index == cur_index, ]
           is_common = strain_wp$index_nuc %in% tmp_common_nucs[[paste("index_nuc", strain, sep="_")]]
           if (common) {
             return(strain_wp[is_common, ])
           }
           return(strain_wp[!is_common, ])
         }

         # Fuzzy regions plus unaligned wp nucleosomes of `strain`, merged with
         # union_regions when there is at least one of them.
         strain_unr = function(strain) {
           strain_fuzzy = fuzzy_maps[[strain]]
           strain_fuzzy = strain_fuzzy[strain_fuzzy$cur_index == cur_index, ]
           unaligned_wp = select_wp(strain, common=FALSE)
           # Only the first four columns of the wp map are stacked under the
           # fuzzy map (assumes both then share the same columns - TODO confirm).
           unr = rbind(strain_fuzzy, unaligned_wp[,1:4])
           if (!is_empty(unr)) {
             unr = union_regions(unr)
           }
           return(unr)
         }

         # UNR candidates from the first strain.
         agg_unr_1 = strain_unr(combi[1])
         if (is_empty(agg_unr_1)) { return(NULL) }

         # UNR candidates from the second strain, cropped and translated before
         # being merged with those of the first strain.
         tmp_unr_nucs_2 = strain_unr(combi[2])
         if (is_empty(tmp_unr_nucs_2)) { return(NULL) }
         agg_unr_2 = crop_fuzzy(tmp_unr_nucs_2, roi, combi[2], config)
         tr_agg_unr_2 = translate_regions(agg_unr_2, combi, cur_index, roi=roi, config=config)
         tr_agg_unr_2 = union_regions(tr_agg_unr_2)
         all_unr = union_regions(rbind(agg_unr_1, tr_agg_unr_2))

         # Common wp nucleosomes of both strains.
         wp_nucs_1 = select_wp(combi[1], common=TRUE)
         wp_nucs_2 = select_wp(combi[2], common=TRUE)
         wp_nucs_2 = crop_fuzzy(wp_nucs_2, roi, combi[2], config)
         if (nrow(wp_nucs_2) == 0) {
           # Nothing to translate.
           tr_wp_nucs_2 = wp_nucs_2
         } else {
           tr_wp_nucs_2 = translate_regions(wp_nucs_2, combi, cur_index, roi=roi, config=config)
         }
         all_wp = union_regions(rbind(wp_nucs_1[,1:4], tr_wp_nucs_2))

         # UNRs are what remains of the candidates once common wp nucs are removed.
         non_inter_unr = substract_region(all_unr, all_wp)
         # substract_region may return NULL; do not hand that to crop_fuzzy.
         if (is.null(non_inter_unr)) { return(NULL) }
         non_inter_unr = crop_fuzzy(non_inter_unr, roi, combi[1], config)
         if (is.null(non_inter_unr)) { return(NULL) }
         non_inter_unr$len = non_inter_unr$upper_bound - non_inter_unr$lower_bound
         non_inter_unr = non_inter_unr[non_inter_unr$len >= min_unr_width,]
         # No UNR is wide enough: answer NULL like the other "nothing found"
         # exits instead of failing on a 1:0 index assignment.
         if (nrow(non_inter_unr) == 0) { return(NULL) }
         non_inter_unr$index_nuc = seq_len(nrow(non_inter_unr))
         return (non_inter_unr)
       ### Returns the UNRs (with added len and index_nuc columns), or NULL when one of the strains has no candidate region or when no UNR remains.
       }

LBMC » NucleoMiner

root / src / R / nucleominer.R @ ec2936ea