chipster.tools.path = '/opt/chipster/tools'
chipster.common.path = '/opt/chipster/comp/modules/common/R-2.12'
chipster.module.path = '/opt/chipster/comp/modules/microarray'
setwd("5e59598f-2138-4766-837c-2a0d130db70b")
filter.by.flag <- "P"
number.of.chips <- 9
# TOOL filter-flags.R: "Filter by flags" (Gene filtering using flags. If more than the specified number of chips have the specified flag for a particular gene, it passes the filter, and is saved in a new data set.)
# INPUT normalized.tsv: normalized.tsv TYPE GENE_EXPRS 
# OUTPUT call-filtered.tsv: call-filtered.tsv 
# PARAMETER filter.by.flag: filter.by.flag TYPE [P: P, M: M, A: A, A.or.M: A.or.M, M.or.P: M.or.P] DEFAULT P (Which flag to filter by)
# PARAMETER number.of.chips: number.of.chips TYPE INTEGER FROM 1 TO 10000 DEFAULT 2 (How many samples the should have the specified call value)


# Filtering using flags (calls)
# JTT 29.6.2006
#
# MG 14.9.2010
# Modified to allow filtering options for A or M and M or P

# Parameter settings (default) for testing purposes
#filter.by.flag<-c("P")
#number.of.chips<-c(9)

# Renaming variables
f1 <- filter.by.flag
f2 <- f1
if (filter.by.flag=="A.or.M") {
	f1 <- "A"
	f2 <- "M"
}
if (filter.by.flag=="M.or.P") {
	f1 <- "M"
	f2 <- "P"
}
p<-number.of.chips

# Loads the normalized data
file<-c("normalized.tsv")
dat<-read.table(file, header=T, sep="\t", row.names=1)

# Separates expression values and flags
calls<-dat[,grep("flag", names(dat))]
dat2<-dat[,grep("chip", names(dat))]

# Sanity checks
if(ncol(as.data.frame(calls))==0) {
	stop("CHIPSTER-NOTE: You do not have any flags!")
}
if(number.of.chips==0) {
	stop("CHIPSTER-NOTE: You must specify at least one array where the flag condition is fulfilled!")
}
if(number.of.chips>ncol(as.data.frame(calls))) {
	p <- ncol(as.data.frame(calls))
}

# Converting the data to data frames
dat2<-data.frame(dat2)
calls<-data.frame(calls)
len<-length(calls)

# Apply filtering
for(i in 1:len) {
	calls[,i]<-ifelse((calls[,i]==f1 | calls[,i]==f2) , 1, 0);
}
s<-apply(calls, MARGIN=1, FUN="sum")
dat2<-dat[which(s>=p),]

# Saving the results into a text file
write.table(dat2, "call-filtered.tsv", sep="\t", row.names=T, col.names=T, quote=F)
print("script-finished-succesfully")
