Mercurial > repos > testtool > geo_data
comparison getGRsetFromGEO/.Rhistory @ 11:983651783ce9 draft
Uploaded
author | testtool |
---|---|
date | Wed, 22 Mar 2017 09:01:06 -0400 |
parents | |
children |
comparison
equal
deleted
inserted
replaced
10:cbc8174bd361 | 11:983651783ce9 |
---|---|
1 TAB <- read.csv("input.csv") | |
2 mysamples <- lapply(TAB$ID,function(x)getGEO(x)) | |
3 input <- function(TAB) { if(is(TAB, "csv")){ | |
4 TAB <- read.csv("input.csv")} | |
5 else{ | |
6 print("error in data file") | |
7 }} | |
8 input() | |
9 TAB <- read.csv("input.csv")} | |
10 TAB <- read.csv("input.csv") | |
11 test_func <- function( | |
12 clusterSize=2, | |
13 cutoff=0.2, | |
14 platform_id='HM450', | |
15 genome_id='hg19') | |
16 { | |
17 args = commandArgs(trailingOnly=TRUE) | |
18 methyl_file = args[1] | |
19 ChiPseq_file = args[2] | |
20 output_file = args[3] | |
21 options(warn=-1) | |
22 TAB=read.csv(methyl_file) | |
23 ChiPseq=import(ChiPseq_file) | |
24 if(is.null(TAB)){ | |
25 stop("Must specify input files") | |
26 }else{ | |
27 mysamples <- lapply(TAB$ID,function(x) getGEO(x)) | |
28 } | |
29 wrappedFunction <- function(test_func) | |
30 s0 <- lapply(mysamples,Table) | |
31 id_ref<-lapply(s0,function(x)x$ID_REF) | |
32 if(length(unique(id_ref)) != 1) { | |
33 stop("Error different ID_REF for samples") | |
34 } else if (is.null((unlist(unique(id_ref))))) { | |
35 stop("NO GSM data avaliable") | |
36 } else { | |
37 values<-do.call("cbind",lapply(s0,function(x)x$VALUE)) | |
38 colnames(values)=TAB$ID | |
39 rownames(values)=id_ref[[1]] | |
40 cg <- rownames(values) | |
41 probe <- c(cg) | |
42 hm450.hg19 <- getPlatform(platform=platform_id, genome=genome_id) | |
43 probe.info <- hm450.hg19[probe] | |
44 f <- data.table(probe=names(probe.info),CHR=as.data.frame(probe.info@seqnames)$value, | |
45 BP=as.numeric(probe.info@elementMetadata$probeStart)) | |
46 designMatrix <- model.matrix(~ TAB$Phenotype) | |
47 DMR <- bumphunter(values, design = designMatrix, | |
48 pos=f$BP,cutoff=cutoff,chr=f$CHR) | |
49 MAT <- DMR$table[which(DMR$table$L>=clusterSize),] | |
50 METH <- GRanges(seqnames=MAT$chr, | |
51 ranges=IRanges | |
52 (start=MAT$start, | |
53 end=MAT$end), | |
54 value_pos=MAT$value) | |
55 peaks<-findOverlapsOfPeaks(probe.info,ChiPseq,maxgap=5000) | |
56 p <- peaks$peaklist$`probe.info///ChiPseq` | |
57 peakAnno <- annotatePeak(p, file=peakAnno) | |
58 output_file <- annotatePeak(p, file=output_file) | |
59 }} | |
60 test_func <- function( | |
61 clusterSize=2, | |
62 cutoff=0.2, | |
63 platform_id='HM450', | |
64 genome_id='hg19') | |
65 { | |
66 args = commandArgs(trailingOnly=TRUE) | |
67 methyl_file = args[1] | |
68 ChiPseq_file = args[2] | |
69 output_file = args[3] | |
70 options(warn=-1) | |
71 TAB=read.csv(methyl_file) | |
72 ChiPseq=import(ChiPseq_file) | |
73 if(is.null(TAB)){ | |
74 stop("Must specify input files") | |
75 }else{ | |
76 mysamples <- lapply(TAB$ID,function(x) getGEO(x)) | |
77 } | |
78 wrappedFunction <- function(test_func) | |
79 s0 <- lapply(mysamples,Table) | |
80 id_ref<-lapply(s0,function(x)x$ID_REF) | |
81 if(length(unique(id_ref)) != 1) { | |
82 stop("Error different ID_REF for samples") | |
83 } else if (is.null((unlist(unique(id_ref))))) { | |
84 stop("NO GSM data avaliable") | |
85 } else { | |
86 values<-do.call("cbind",lapply(s0,function(x)x$VALUE)) | |
87 colnames(values)=TAB$ID | |
88 rownames(values)=id_ref[[1]] | |
89 cg <- rownames(values) | |
90 probe <- c(cg) | |
91 hm450.hg19 <- getPlatform(platform=platform_id, genome=genome_id) | |
92 probe.info <- hm450.hg19[probe] | |
93 f <- data.table(probe=names(probe.info),CHR=as.data.frame(probe.info@seqnames)$value, | |
94 BP=as.numeric(probe.info@elementMetadata$probeStart)) | |
95 designMatrix <- model.matrix(~ TAB$Phenotype) | |
96 DMR <- bumphunter(values, design = designMatrix, | |
97 pos=f$BP,cutoff=cutoff,chr=f$CHR) | |
98 MAT <- DMR$table[which(DMR$table$L>=clusterSize),] | |
99 METH <- GRanges(seqnames=MAT$chr, | |
100 ranges=IRanges | |
101 (start=MAT$start, | |
102 end=MAT$end), | |
103 value_pos=MAT$value) | |
104 peaks<-findOverlapsOfPeaks(probe.info,ChiPseq,maxgap=5000) | |
105 p <- peaks$peaklist$`probe.info///ChiPseq` | |
106 peakAnno <- annotatePeak(p, file=peakAnno) | |
107 output_file <- annotatePeak(p, file=output_file) | |
108 }} | |
109 ) | |
110 a<-c(3.2,3.7,3.6,3.9,3.7,3.5,3.8,4,3.5) | |
111 a<-c(3.2,3.7,3.6,3.9,3.7,3.5,3.8,4,3.5) | |
112 b<-c(2.9,2.7,2,6,2.7,2.5,2.5,3.2,3.1,3.3,2.8) | |
113 a-b | |
114 file<-read.csv("~/Documents/SS2.csv") | |
115 head(file) | |
116 e | |
117 file | |
118 t.test(file$WBT,file$WBA) | |
119 t.test(file$WBT,file$WBA,paired=TRUE) | |
120 mysamples <- lapply(TAB$ID,function(x) TablegetGEO(x)) | |
121 require("GEOquery",quietly = TRUE) | |
122 require("BiocGenerics",quietly = TRUE) | |
123 args <- commandArgs(trailingOnly = TRUE) | |
124 csv_file = args[1] | |
125 #csv_file <- ("test-data/input.csv") | |
126 TAB=read.csv(csv_file) | |
127 if(is.null(TAB)){ | |
128 stop("Must specify input files") | |
129 }else{ | |
130 mysamples <- lapply(TAB$ID,function(x) TablegetGEO(x)) | |
131 } | |
132 csv_file <- ("test-data/input.csv") | |
133 TAB=read.csv(csv_file) | |
134 TAB | |
135 csv_file<-("test-data/input.csv") | |
136 TAB = read.csv(csv_file) | |
137 TAB | |
138 ??bumphunter |