# This script annotates genomic positions to genes for Ingenuity analyses.
# Aaron Sarver, November 15, 2010
# version 1.0
#
# Source: lib/convert_nr_2_annot.pl, revision 3:17ce4f3bffa2
#         (author jesse-erdmann, Tue, 24 Jan 2012 18:33:41 -0500).
#
# Usage: perl convert_nr_2_annot.pl <input> <output>
#
#   <input>   Tab-separated text. Column 1 is copied through unchanged and
#             column 2 is used as a number (presumably chromosome and
#             position -- TODO confirm against whatever produces this file).
#   <output>  Receives one line per distinct gene name: "<gene>\t10".
#
# Steps:
#   1. Write CIS/input.txt containing column 1 plus a +/-50 window around
#      column 2 for every input line.
#   2. Run lib/feature_finder.pl on that file against lib/mm9.bed, which is
#      expected to produce CIS/input2.txt.
#   3. Split column 4 of CIS/input2.txt on ", " and collect the names.
#   4. Write each distinct name once, in first-seen order, to <output>.
#
# Every path other than <input>/<output> is relative to the current working
# directory; the CIS/ directory must already exist because open() does not
# create directories.
#
# The script dies with a message (non-zero exit) if any file cannot be
# opened or written, or if feature_finder.pl cannot be run or exits non-zero.

use strict;
use warnings;

my $WINDOW       = 50;                  # half-width of the window around column 2
my $WINDOW_FILE  = 'CIS/input.txt';     # input handed to feature_finder.pl
my $FEATURE_FILE = 'CIS/input2.txt';    # output expected from feature_finder.pl
my $SCORE        = 10;                  # constant second output column (meaning
                                        # is not evident from this script)

# Extra arguments are ignored, as they always were.
@ARGV >= 2
    or die "Usage: $0 <input> <output>\n";
my ($in, $out) = @ARGV;

# Three-argument open: the mode can never be taken from the file name itself.
open my $src_fh, '<', $in
    or die "Cannot open '$in' for reading: $!\n";
open my $win_fh, '>', $WINDOW_FILE
    or die "Cannot open '$WINDOW_FILE' for writing: $!\n";
# Opened (and truncated) up front so an unwritable output path is reported
# before the external step runs.
open my $fin_fh, '>', $out
    or die "Cannot open '$out' for writing: $!\n";

# Step 1: one window line per input line.
while (my $line = <$src_fh>) {
    chomp $line;
    my @field = split /\t/, $line;

    # A missing or non-numeric column 2 counts as 0 and a missing column 1
    # prints as an empty string, so the generated file is the same as before
    # for every input; the corresponding warnings are silenced so stderr
    # stays quiet for inputs that used to be accepted.
    no warnings qw(numeric uninitialized);
    my $start = $field[1] - $WINDOW;
    my $stop  = $field[1] + $WINDOW;

    print {$win_fh} "$field[0]\t$start\t$stop\n"
        or die "Cannot write to '$WINDOW_FILE': $!\n";
}
close $src_fh;

# Must be closed (flushed) before feature_finder.pl reads it.
close $win_fh
    or die "Cannot close '$WINDOW_FILE': $!\n";

# Step 2: list form of system() -- no shell is involved.
my @finder_cmd = (
    'perl', 'lib/feature_finder.pl',
    '-i',    $WINDOW_FILE,
    '-icol', '1:2:3:6:13',
    '-f',    'lib/mm9.bed',
    '-o',    $FEATURE_FILE,
);
my $status = system @finder_cmd;
if ($status == -1) {
    die "Could not run lib/feature_finder.pl: $!\n";
}
elsif ($status != 0) {
    die sprintf "lib/feature_finder.pl failed (wait status %d, exit code %d)\n",
        $status, $status >> 8;
}

# Step 3: collect distinct names from column 4, keeping first-seen order.
open my $feat_fh, '<', $FEATURE_FILE
    or die "Cannot open '$FEATURE_FILE' for reading: $!\n";

my %seen;
my @uniq;
while (my $line = <$feat_fh>) {
    chomp $line;
    my @field = split /\t/, $line;

    # Lines with fewer than four columns contribute no names.
    next unless defined $field[3];

    for my $gene (split /,\s/, $field[3]) {
        next if $seen{$gene}++;
        push @uniq, $gene;
    }
}
close $feat_fh;

# Step 4: write the result.
for my $gene (@uniq) {
    print {$fin_fh} "$gene\t$SCORE\n"
        or die "Cannot write to '$out': $!\n";
}

# Buffered write errors only surface at close, so check it.
close $fin_fh
    or die "Cannot close '$out': $!\n";