self.pathout = analyse.pathout
self.analyse = analyse
self.parametres = analyse.parametres
- self.scriptout = self.pathout['lastRscript.R']
+ #self.scriptout = ffr(self.pathout['lastRscript.R'])
+ self.scriptout = self.pathout['temp']
self.script = u"#Script genere par IRaMuTeQ - %s\n" % datetime.now().ctime()
-
+
def add(self, txt) :
self.script = '\n'.join([self.script, txt])
-
+
def defvar(self, name, value) :
self.add(' <- '.join([name, value]))
data1 <- as(data1, "dgCMatrix")
row.names(data1) <- 1:nrow(data1)
""" % ffr(DicoPath['TableUc1'])
-
+
if classif_mode == 0:
txt += """
data2 <- readMM("%s")
""" % ffr(DicoPath['TableUc2'])
txt += """
log1 <- "%s"
- chd1<-CHD(data1, x = nbt, mode.patate = mode.patate, svd.method = svd.method, libsvdc.path = libsvdc.path, log.file = log1)
+ #print('FIXME : source newCHD')
+ #source('/home/pierre/workspace/iramuteq/Rscripts/newCHD.R')
+ #chd1<-CHD(data1, x = nbt, mode.patate = mode.patate, svd.method = svd.method, libsvdc.path = libsvdc.path, find='matrix', sample=20, amp=500)
+ chd1<-CHD(data1, x = nbt, mode.patate = mode.patate, svd.method = svd.method, libsvdc.path = libsvdc.path)#, log.file = log1)
""" % ffr(DicoPath['log-chd1.txt'])
-
+
if classif_mode == 0:
txt += """
log2 <- "%s"
- chd2<-CHD(data2, x = nbt, mode.patate = mode.patate, svd.method = svd.method, libsvdc.path = libsvdc.path, log.file = log2)
+ chd2<-CHD(data2, x = nbt, mode.patate = mode.patate, svd.method =
+ svd.method, libsvdc.path = libsvdc.path)#, log.file = log2)
""" % ffr(DicoPath['log-chd2.txt'])
-
+
txt += """
#lecture des uce
listuce1<-read.csv2("%s")
""" % ffr(DicoPath['listeuce1'])
-
+
if classif_mode == 0:
txt += """
listuce2<-read.csv2("%s")
""" % ffr(DicoPath['listeuce2'])
-
+
txt += """
rm(data1)
"""
-
+
if classif_mode == 0:
txt += """
rm(data2)
txt += """
classif_mode <- %i
mincl <- %i
+ if (mincl == 0) {mincl <- round(nrow(chd1$n1)/(nbt+1))}
uceout <- "%s"
+ write.csv2(chd1$n1, file="%s")
if (classif_mode == 0) {
chd.result <- Rchdtxt(uceout, chd1, chd2 = chd2, mincl = mincl,classif_mode = classif_mode, nbt = nbt)
+ classeuce1 <- chd.result$cuce1
+ tree.tot1 <- make_tree_tot(chd1)
+ tree.cut1 <- make_dendro_cut_tuple(tree.tot1$dendro_tuple, chd.result$coord_ok, classeuce1, 1, nbt)
+
} else {
- chd.result <- Rchdtxt(uceout, chd1, chd2 = chd1, mincl = mincl,classif_mode = classif_mode, nbt = nbt)
+ #chd.result <- Rchdtxt(uceout, chd1, chd2 = chd1, mincl = mincl,classif_mode = classif_mode, nbt = nbt)
+ tree.tot1 <- make_tree_tot(chd1)
+ terminales <- find.terminales(chd1$n1, chd1$list_mere, chd1$list_fille, mincl)
+ tree.cut1 <- make.classes(terminales, chd1$n1, tree.tot1$tree.cl, chd1$list_fille)
+ write.csv2(tree.cut1$n1, uceout)
+ chd.result <- tree.cut1
}
- n1 <- chd.result$n1
- classeuce1 <- chd.result$cuce1
- classes<-n1[,ncol(n1)]
- write.csv2(n1, file="%s")
- rm(n1)
- """ % (classif_mode, mincl, ffr(DicoPath['uce']), ffr(DicoPath['n1.csv']))
-
+ classes<-chd.result$n1[,ncol(chd.result$n1)]
+ write.csv2(chd.result$n1, file="%s")
+ """ % (classif_mode, mincl, ffr(DicoPath['uce']), ffr(DicoPath['n1-1.csv']), ffr(DicoPath['n1.csv']))
+
txt += """
- tree.tot1 <- make_tree_tot(chd1)
+# tree.tot1 <- make_tree_tot(chd1)
# open_file_graph("%s", widt = 600, height=400)
# plot(tree.tot1$tree.cl)
# dev.off()
""" % ffr(DicoPath['arbre1'])
-
+
if classif_mode == 0:
txt += """
classeuce2 <- chd.result$cuce2
# open_file_graph("%s", width = 600, height=400)
# plot(tree.tot2$tree.cl)
# dev.off()
- """ % ffr(DicoPath['arbre2'] )
-
+ """ % ffr(DicoPath['arbre2'] )
+
txt += """
- tree.cut1 <- make_dendro_cut_tuple(tree.tot1$dendro_tuple, chd.result$coord_ok, classeuce1, 1, nbt)
- save(tree.cut1, file="%s")
-
+ save(tree.cut1, file="%s")
+
open_file_graph("%s", width = 600, height=400)
plot.dendropr(tree.cut1$tree.cl,classes, histo=TRUE)
open_file_graph("%s", width = 600, height=400)
plot(tree.cut1$dendro_tot_cl)
dev.off()
""" % (ffr(DicoPath['Rdendro']), ffr(DicoPath['dendro1']), ffr(DicoPath['arbre1']))
-
+
if classif_mode == 0:
txt += """
tree.cut2 <- make_dendro_cut_tuple(tree.tot2$dendro_tuple, chd.result$coord_ok, classeuce2, 2, nbt)
plot(tree.cut2$dendro_tot_cl)
dev.off()
""" % (ffr(DicoPath['dendro2']), ffr(DicoPath['arbre2']))
-
+
txt += """
-
+
#save.image(file="%s")
""" % (ffr(DicoPath['RData']))
-
+
fileout = open(DicoPath['Rchdtxt'], 'w')
fileout.write(txt)
fileout.close()
dataet<-read.csv2("%s", header = FALSE, sep = ';',quote = '\"', row.names = 1, na.strings = 'NA')
""" % (ffr(DictChdTxtOut['Contout']), ffr(DictChdTxtOut['ContSupOut']), ffr(DictChdTxtOut['ContEtOut']))
txt += """
-tablesqrpact<-BuildProf(as.matrix(dataact),n1,clnb)
-tablesqrpsup<-BuildProf(as.matrix(datasup),n1,clnb)
-tablesqrpet<-BuildProf(as.matrix(dataet),n1,clnb)
+print('ATTENTION NEW BUILD PROF')
+#tablesqrpact<-BuildProf(as.matrix(dataact),n1,clnb)
+#tablesqrpsup<-BuildProf(as.matrix(datasup),n1,clnb)
+#tablesqrpet<-BuildProf(as.matrix(dataet),n1,clnb)
+tablesqrpact<-new.build.prof(as.matrix(dataact),n1,clnb)
+tablesqrpsup<-new.build.prof(as.matrix(datasup),n1,clnb)
+tablesqrpet<-new.build.prof(as.matrix(dataet),n1,clnb)
+
"""
txt += """
PrintProfile(n1,tablesqrpact[4],tablesqrpet[4],tablesqrpact[5],tablesqrpet[5],clnb,"%s","%s",tablesqrpsup[4],tablesqrpsup[5])
else :
txt += """
word <- FALSE
+ index <- NULL
"""
txt += """
dm <-readMM(dm.path)
txt += """
mat <- graph.word(mat, index)
cs <- colSums(mat)
- if (length(cs)) mat <- mat[,-which(cs==0)]
+ if (length(which(cs==0))) mat <- mat[,-which(cs==0)]
rs <- rowSums(mat)
- if (length(rs)) mat <- mat[-which(rs==0),]
- if (length(cs)) dm <- dm[, -which(cs==0)]
+ if (length(which(rs==0))) mat <- mat[-which(rs==0),]
+ if (length(which(cs==0))) dm <- dm[,-which(cs==0)]
+ if (word) {
+ index <- which(colnames(mat)==forme)
+ }
"""
if self.parametres['layout'] == 0 : layout = 'random'
if self.parametres['layout'] == 2 : layout = 'frutch'
if self.parametres['layout'] == 3 : layout = 'kawa'
if self.parametres['layout'] == 4 : layout = 'graphopt'
+ if self.parametres['layout'] == 5 : layout = 'spirale'
+ if self.parametres['layout'] == 6 : layout = 'spirale3D'
self.filename=''
while os.path.exists(os.path.join(dirout,'web_'+str(graphnb))):
graphnb +=1
self.filename = ffr(os.path.join(dirout,'web_'+str(graphnb)))
- os.mkdir(self.filename)
+ os.mkdir(self.filename)
self.filename = os.path.join(self.filename, 'gexf.gexf')
if self.parametres['type_graph'] == 4 :
graphnb = 1
if self.parametres['film'] :
txt += """
film <- "%s"
- """ % self.pathout['film']
+ """ % ffr(self.pathout['film'])
else :
txt += """
film <- NULL
txt += """
eff <- colSums(dm)
x <- list(mat = mat, eff = eff)
- graph.simi <- do.simi(x, method='%s', seuil = seuil, p.type = '%s', layout.type = '%s', max.tree = %s, coeff.vertex=%s, coeff.edge = %s, minmaxeff = minmaxeff, vcexminmax = vcexminmax, cex = cex, coords = coords, communities = communities, halo = halo)
+ graph.simi <- do.simi(x, method='%s', seuil = seuil, p.type = '%s', layout.type = '%s', max.tree = %s, coeff.vertex=%s, coeff.edge = %s, minmaxeff = minmaxeff, vcexminmax = vcexminmax, cex = cex, coords = coords, communities = communities, halo = halo, index.word=index)
""" % (method, type, layout, arbremax, coeff_tv, coeff_te)
if self.parametres.get('bystar',False) :
"""
class MergeGraphes(PrintRScript) :
- def __init__(self, parametres):
+ def __init__(self, analyse):
self.script = u"#Script genere par IRaMuTeQ - %s\n" % datetime.now().ctime()
self.pathout = PathOut()
- self.parametres = parametres
+ self.parametres = analyse.parametres
self.scriptout = self.pathout['temp']
-
+ self.analyse = analyse
+
def make_script(self) :
#FIXME
-
+
txt = """
library(igraph)
library(Matrix)
V(g)$weight <- (graph.simi$mat.eff/nrow(dm))*100
graphs[['%s']] <- g
"""
- for i, graph in enumerate(self.parametres['lgraphes']) :
+ for i, graph in enumerate(self.parametres['graphs']) :
path = os.path.dirname(graph)
gname = ''.join(['g', `i`])
RData = os.path.join(path,'RData.RData')
dev.off()
""" % ffr(self.pathout['barplotrow.png'])
self.add(txt)
- self.write()
+ self.write()
+
+class LabbeScript(PrintRScript) :
+ def make_script(self) :
+ self.sources([self.analyse.parent.RscriptsPath['distance-labbe.R'],
+ self.analyse.parent.RscriptsPath['Rgraph']])
+ txt = """
+ tab <- read.csv2("%s", header=TRUE, sep=';', row.names=1)
+ """ % (ffr(self.pathout['tableafcm.csv']))
+ txt += """
+ dist.mat <- dist.labbe(tab)
+ dist.mat <- as.dist(dist.mat, upper=F, diag=F)
+ write.table(as.matrix(dist.mat), "%s", sep='\t')
+ library(cluster)
+ library(ape)
+ chd <- hclust(dist.mat, method="ward.D2")
+ open_file_graph("%s", width=1000, height=1000, svg=F)
+ par(cex=1.2)
+ plot.phylo(as.phylo(chd), type='unrooted', lab4ut="axial")
+ dev.off()
+ """ % (ffr(self.pathout['distmat.csv']), ffr(self.pathout['labbe-tree.png']))
+ txt +="""
+ open_file_graph("%s", width=1000, height=1000, svg=F)
+ par(mar=c(10,1,1,10))
+ heatmap(as.matrix(dist.mat), symm = T, distfun=function(x) as.dist(x), margins=c(10,10))
+ dev.off()
+ """ % ffr(self.pathout['labbe-heatmap.png'])
+ txt += """
+ #http://stackoverflow.com/questions/3081066/what-techniques-exists-in-r-to-visualize-a-distance-matrix
+ dst <- data.matrix(dist.mat)
+ dim <- ncol(dst)
+ rn <- row.names(as.matrix(dist.mat))
+ open_file_graph("%s", width=1500, height=1000, svg=F)
+ par(mar=c(10,10,3,3))
+ image(1:dim, 1:dim, dst, axes = FALSE, xlab="", ylab="")
+ axis(1, 1:dim, rn, cex.axis = 0.9, las=3)
+ axis(2, 1:dim, rn, cex.axis = 0.9, las=1)
+ text(expand.grid(1:dim, 1:dim), sprintf("%%0.2f", dst), cex=0.6)
+ dev.off()
+ """ % ffr(self.pathout['labbe-matrix.png'])
+ self.add(txt)
+ self.write()
+
+class ChronoChi2Script(PrintRScript) :
+ def make_script(self) :
+ self.sources([self.analyse.parent.RscriptsPath['Rgraph']])
+ print self.parametres
+ txt = """
+ inRData <- "%s"
+ dendrof <- "%s"
+ load(inRData)
+ load(dendrof)
+ """ % (ffr(self.pathout['RData.RData']), ffr(self.pathout['dendrogramme.RData']))
+ txt += """
+ svg <- %s
+ """ % self.parametres['svg']
+ txt += """
+ tc <- which(grepl("%s",rownames(chistabletot)))
+ rn <- rownames(chistabletot)[tc]
+ tc <- tc[order(rn)]
+ dpt <- chistabletot[tc,]
+ tot <- afctable[tc,]
+ tcp <- rowSums(tot)
+ ptc <- tcp/sum(tcp)
+ dpt <- t(dpt)
+ dd <- dpt
+ """ % self.parametres['var'].replace(u'*', u"\\\\*")
+ txt += """
+ classes <- n1[,ncol(n1)]
+ tcl <- table(classes)
+ if ('0' %in% names(tcl)) {
+ to.vire <- which(names(tcl) == '0')
+ tcl <- tcl[-to.vire]
+ }
+ tclp <- tcl/sum(tcl)
+
+ #chi2 colors
+ library(ape)
+ k <- 1e-02
+ lcol <- NULL
+ lk <- k
+ for (i in 1:5) {
+ lcol <- c(lcol, qchisq(1-k,1))
+ k <- k/10
+ lk <- c(lk,k)
+ }
+ lcol <- c(3.84, lcol)
+ lcol <- c(-Inf,lcol)
+ lcol <- c(lcol, Inf)
+ lk <- c(0.05,lk)
+ breaks <- lcol
+ alphas <- seq(0,1, length.out=length(breaks))
+ clod <- rev(as.numeric(tree.cut1$tree.cl$tip.label))
+ #end
+ """
+ txt += """
+ open_file_graph("%s", w=%i, h=%i, svg=svg)
+ """ % (ffr(self.parametres['tmpgraph']), self.parametres['width'], self.parametres['height'])
+ txt += """
+ par(mar=c(3,3,3,3))
+ mat.graphic <- matrix(c(rep(1,nrow(dd)),c(2:(nrow(dd)+1))), ncol=2)
+ mat.graphic <- rbind(mat.graphic, c(max(mat.graphic) + 1 , max(mat.graphic) + 2))
+ hauteur <- tclp[clod] * 0.9
+ heights.graphic <- append(hauteur, 0.1)
+ layout(mat.graphic, heights=heights.graphic, widths=c(0.15,0.85))
+ par(mar=c(0,0,0,0))
+ tree.toplot <- tree.cut1$tree.cl
+ num.label <- as.numeric(tree.cut1$tree.cl$tip.label)
+ col.tree <- rainbow(length(num.label))[num.label]
+ #tree.toplot$tip.label <- paste('classe ', tree.toplot$tip.label)
+ plot.phylo(tree.toplot,label.offset=0.1, cex=1.1, no.margin=T, tip.color = col.tree)
+ for (i in clod) {
+ print(i)
+ par(mar=c(0,0,0,0))
+ lcol <- cut(dd[i,], breaks, include.lowest=TRUE)
+ ulcol <- names(table(lcol))
+ lcol <- as.character(lcol)
+ for (j in 1:length(ulcol)) {
+ lcol[which(lcol==ulcol[j])] <- j
+ }
+ lcol <- as.numeric(lcol)
+ mcol <- rainbow(nrow(dd))[i]
+ last.col <- NULL
+ for (k in alphas) {
+ last.col <- c(last.col, rgb(r=col2rgb(mcol)[1]/255, g=col2rgb(mcol)[2]/255, b=col2rgb(mcol)[3]/255, a=k))
+ }
+ #print(last.col)
+
+ barplot(rep(1,ncol(dd)), width=ptc, names.arg=FALSE, axes=FALSE, col=last.col[lcol], border=rgb(r=0, g=0, b=0, a=0.3))
+ }
+ plot(0,type='n',axes=FALSE,ann=FALSE)
+ label.coords <- barplot(rep(1, ncol(dd)), width=ptc, names.arg = F, las=2, axes=F, ylim=c(0,1), plot=T, col='white')
+ text(x=label.coords, y=0.5, labels=rn[order(rn)], srt=90)
+ dev.off()
+ """
+ self.add(txt)
+ self.write()
+
+class ChronoPropScript(PrintRScript) :
+ def make_script(self) :
+ self.sources([self.analyse.parent.RscriptsPath['Rgraph']])
+ print self.parametres
+ txt = """
+ inRData <- "%s"
+ dendrof <- "%s"
+ load(inRData)
+ load(dendrof)
+ """ % (ffr(self.pathout['RData.RData']), ffr(self.pathout['dendrogramme.RData']))
+ txt += """
+ svg <- %s
+ """ % self.parametres['svg']
+ txt += """
+ tc <- which(grepl("%s",rownames(chistabletot)))
+ rn <- rownames(chistabletot)[tc]
+ tc <- tc[order(rn)]
+ dpt <- chistabletot[tc,]
+ tot <- afctable[tc,]
+ tcp <- rowSums(tot)
+ ptc <- tcp/sum(tcp)
+ dpt <- t(dpt)
+ dd <- dpt
+ """ % self.parametres['var'].replace(u'*', u"\\\\*")
+ txt += """
+ classes <- n1[,ncol(n1)]
+ tcl <- table(classes)
+ if ('0' %in% names(tcl)) {
+ to.vire <- which(names(tcl) == '0')
+ tcl <- tcl[-to.vire]
+ }
+ tclp <- tcl/sum(tcl)
+ """
+ txt += """
+ open_file_graph("%s", w=%i, h=%i, svg=svg)
+ """ % (ffr(self.parametres['tmpgraph']), self.parametres['width'], self.parametres['height'])
+ txt+= """
+ ptt <- prop.table(as.matrix(tot), 1)
+ par(mar=c(10,2,2,2))
+ barplot(t(ptt)[as.numeric(tree.cut1$tree.cl$tip.label),], col=rainbow(ncol(ptt))[as.numeric(tree.cut1$tree.cl$tip.label)], width=ptc, las=3, space=0.05, cex.axis=0.7, border=NA)
+ dev.off()
+ """
+ self.add(txt)
+ self.write()
+
+class ReDoProfScript(PrintRScript) :
+ def make_script(self) :
+ self.sources([self.analyse.parent.RscriptsPath['chdfunct.R']])
+ print self.parametres
+