annotate plotmatrix.py @ 13:292186c14b08

Uploaded
author xuebing
date Sat, 10 Mar 2012 08:17:36 -0500
parents b7f1d9f8f3bc
children
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
11
b7f1d9f8f3bc Uploaded
xuebing
parents:
diff changeset
1 import sys,os
b7f1d9f8f3bc Uploaded
xuebing
parents:
diff changeset
2
b7f1d9f8f3bc Uploaded
xuebing
parents:
diff changeset
3 infile = sys.argv[1]
b7f1d9f8f3bc Uploaded
xuebing
parents:
diff changeset
4 outfile = sys.argv[2]
b7f1d9f8f3bc Uploaded
xuebing
parents:
diff changeset
5 uselog = sys.argv[3]
b7f1d9f8f3bc Uploaded
xuebing
parents:
diff changeset
6 subset = sys.argv[4]
b7f1d9f8f3bc Uploaded
xuebing
parents:
diff changeset
7 reorder = sys.argv[5]
b7f1d9f8f3bc Uploaded
xuebing
parents:
diff changeset
8 color = sys.argv[6]
b7f1d9f8f3bc Uploaded
xuebing
parents:
diff changeset
9 scale = sys.argv[7] # rescale each row
b7f1d9f8f3bc Uploaded
xuebing
parents:
diff changeset
10 cols = sys.argv[8]
b7f1d9f8f3bc Uploaded
xuebing
parents:
diff changeset
11 rscript = open('tmp.r','w')
b7f1d9f8f3bc Uploaded
xuebing
parents:
diff changeset
12
b7f1d9f8f3bc Uploaded
xuebing
parents:
diff changeset
13 rscript.write("x <- read.table('"+infile+"')\n")
b7f1d9f8f3bc Uploaded
xuebing
parents:
diff changeset
14 rscript.write("x <- x[,c("+cols+")]\n")
b7f1d9f8f3bc Uploaded
xuebing
parents:
diff changeset
15 rscript.write("nr <- nrow(x) \n")
b7f1d9f8f3bc Uploaded
xuebing
parents:
diff changeset
16 rscript.write("nc <- ncol(x)\n")
b7f1d9f8f3bc Uploaded
xuebing
parents:
diff changeset
17 rscript.write("rowsum <- apply(x,1,sum)\n")
b7f1d9f8f3bc Uploaded
xuebing
parents:
diff changeset
18
b7f1d9f8f3bc Uploaded
xuebing
parents:
diff changeset
19 if subset =='subset':
b7f1d9f8f3bc Uploaded
xuebing
parents:
diff changeset
20 rscript.write("if (nr*nc > 100000) {\n")
b7f1d9f8f3bc Uploaded
xuebing
parents:
diff changeset
21 rscript.write(" nr2 <- as.integer(100000/nc)\n")
b7f1d9f8f3bc Uploaded
xuebing
parents:
diff changeset
22 rscript.write(" subind <- sample(seq(nr),nr2)\n")
b7f1d9f8f3bc Uploaded
xuebing
parents:
diff changeset
23 rscript.write(" x <- x[subind,]\n")
b7f1d9f8f3bc Uploaded
xuebing
parents:
diff changeset
24 rscript.write(" rowsum <- rowsum[subind]\n")
b7f1d9f8f3bc Uploaded
xuebing
parents:
diff changeset
25 rscript.write("}\n")
b7f1d9f8f3bc Uploaded
xuebing
parents:
diff changeset
26
b7f1d9f8f3bc Uploaded
xuebing
parents:
diff changeset
27 rscript.write("pdf('"+outfile+"')\n")
b7f1d9f8f3bc Uploaded
xuebing
parents:
diff changeset
28
b7f1d9f8f3bc Uploaded
xuebing
parents:
diff changeset
29 if uselog == 'uselog':
b7f1d9f8f3bc Uploaded
xuebing
parents:
diff changeset
30 rscript.write("x <- -(log(as.matrix(x,nc=nc)))\n")
b7f1d9f8f3bc Uploaded
xuebing
parents:
diff changeset
31 else:
b7f1d9f8f3bc Uploaded
xuebing
parents:
diff changeset
32 rscript.write("x <- -as.matrix(x,nc=nc)\n")
b7f1d9f8f3bc Uploaded
xuebing
parents:
diff changeset
33 if scale == 'scale':
b7f1d9f8f3bc Uploaded
xuebing
parents:
diff changeset
34 rscript.write("x <- scale(x)\n")
b7f1d9f8f3bc Uploaded
xuebing
parents:
diff changeset
35 if reorder == 'average':
b7f1d9f8f3bc Uploaded
xuebing
parents:
diff changeset
36 rscript.write("hc <- hclust(dist(x),method= 'average')\n")
b7f1d9f8f3bc Uploaded
xuebing
parents:
diff changeset
37 rscript.write("x <- x[hc$order,]\n")
b7f1d9f8f3bc Uploaded
xuebing
parents:
diff changeset
38 elif reorder == 'centroid':
b7f1d9f8f3bc Uploaded
xuebing
parents:
diff changeset
39 rscript.write("hc <- hclust(dist(x),method= 'centroid')\n")
b7f1d9f8f3bc Uploaded
xuebing
parents:
diff changeset
40 rscript.write("x <- x[hc$order,]\n")
b7f1d9f8f3bc Uploaded
xuebing
parents:
diff changeset
41 elif reorder == 'complete':
b7f1d9f8f3bc Uploaded
xuebing
parents:
diff changeset
42 rscript.write("hc <- hclust(dist(x),method= 'complete')\n")
b7f1d9f8f3bc Uploaded
xuebing
parents:
diff changeset
43 rscript.write("x <- x[hc$order,]\n")
b7f1d9f8f3bc Uploaded
xuebing
parents:
diff changeset
44 elif reorder == 'single':
b7f1d9f8f3bc Uploaded
xuebing
parents:
diff changeset
45 rscript.write("hc <- hclust(dist(x),method= 'single')\n")
b7f1d9f8f3bc Uploaded
xuebing
parents:
diff changeset
46 rscript.write("x <- x[hc$order,]\n")
b7f1d9f8f3bc Uploaded
xuebing
parents:
diff changeset
47 elif reorder == 'median':
b7f1d9f8f3bc Uploaded
xuebing
parents:
diff changeset
48 rscript.write("hc <- hclust(dist(x),method= 'median')\n")
b7f1d9f8f3bc Uploaded
xuebing
parents:
diff changeset
49 rscript.write("x <- x[hc$order,]\n")
b7f1d9f8f3bc Uploaded
xuebing
parents:
diff changeset
50 elif reorder == 'sort_by_total':
b7f1d9f8f3bc Uploaded
xuebing
parents:
diff changeset
51 rscript.write("srt <- sort(rowsum,index.return=T)\n")
b7f1d9f8f3bc Uploaded
xuebing
parents:
diff changeset
52 rscript.write("x <- x[srt$ix,]\n")
b7f1d9f8f3bc Uploaded
xuebing
parents:
diff changeset
53 elif reorder == 'sort_by_center':
b7f1d9f8f3bc Uploaded
xuebing
parents:
diff changeset
54 rscript.write("srt <- sort(x[,as.integer(nc/2)],index.return=T)\n")
b7f1d9f8f3bc Uploaded
xuebing
parents:
diff changeset
55 rscript.write("x <- x[srt$ix,]\n")
b7f1d9f8f3bc Uploaded
xuebing
parents:
diff changeset
56 if color == 'heat':
b7f1d9f8f3bc Uploaded
xuebing
parents:
diff changeset
57 rscript.write("colormap = heat.colors(1000)\n")
b7f1d9f8f3bc Uploaded
xuebing
parents:
diff changeset
58 elif color == 'topo':
b7f1d9f8f3bc Uploaded
xuebing
parents:
diff changeset
59 rscript.write("colormap = topo.colors(1000)\n")
b7f1d9f8f3bc Uploaded
xuebing
parents:
diff changeset
60 elif color == 'rainbow':
b7f1d9f8f3bc Uploaded
xuebing
parents:
diff changeset
61 rscript.write("colormap = rainbow(1000)\n")
b7f1d9f8f3bc Uploaded
xuebing
parents:
diff changeset
62 elif color == 'terrain':
b7f1d9f8f3bc Uploaded
xuebing
parents:
diff changeset
63 rscript.write("colormap = terrain.colors(1000)\n")
b7f1d9f8f3bc Uploaded
xuebing
parents:
diff changeset
64 else:
b7f1d9f8f3bc Uploaded
xuebing
parents:
diff changeset
65 rscript.write("colormap = gray.colors(1000)\n")
b7f1d9f8f3bc Uploaded
xuebing
parents:
diff changeset
66
b7f1d9f8f3bc Uploaded
xuebing
parents:
diff changeset
67 #rscript.write("qt <- quantile(as.vector(x),probs=c(0.1,0.9))\n")
b7f1d9f8f3bc Uploaded
xuebing
parents:
diff changeset
68 #rscript.write("breaks <- c(min(as.vector(x)),seq(qt[1],qt[2],length.out=99),max(as.vector(x)))\n")
b7f1d9f8f3bc Uploaded
xuebing
parents:
diff changeset
69 #rscript.write("image(t(x),col=colormap,breaks=breaks,axes=F)\n")
b7f1d9f8f3bc Uploaded
xuebing
parents:
diff changeset
70 rscript.write("image(t(x),col=colormap,axes=F)\n")
b7f1d9f8f3bc Uploaded
xuebing
parents:
diff changeset
71 rscript.write("dev.off()\n")
b7f1d9f8f3bc Uploaded
xuebing
parents:
diff changeset
72
b7f1d9f8f3bc Uploaded
xuebing
parents:
diff changeset
73 rscript.close()
b7f1d9f8f3bc Uploaded
xuebing
parents:
diff changeset
74
b7f1d9f8f3bc Uploaded
xuebing
parents:
diff changeset
75 os.system("R --slave < tmp.r")
b7f1d9f8f3bc Uploaded
xuebing
parents:
diff changeset
76 os.system("rm tmp.r")
b7f1d9f8f3bc Uploaded
xuebing
parents:
diff changeset
77