annotate splicetrap/bin/scanbed2txdb.pl @ 7:37a16ff93dd9 draft default tip

planemo upload
author bioitcore
date Thu, 12 Oct 2017 16:26:36 -0400
parents
children
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
7
37a16ff93dd9 planemo upload
bioitcore
parents:
diff changeset
#argv0: input transcript bed file
#argv1: output filename, will be in AS format
#
# Overview of this part of the script:
#   1. Sort the input (column 6, column 1, then columns 2 and 3 numerically,
#      i.e. the fields read below as strand, chr, start and end) into
#      <basename of argv1>.cache/<basename of argv0>.sort.
#   2. Walk the sorted transcripts and group them into "contigs": a new contig
#      starts when a transcript begins past the furthest end seen so far, or
#      when the chromosome or the strand changes.
#   3. Within a contig, record every run of 1, 2 and 3 consecutive exons as a
#      connection string "start-end,start-end,...," and remember which
#      transcript names contain it.
#   4. When a contig is complete, classify its connections with scanevents(),
#      print them with printanno() into argv1, and write one line per event
#      id (event id, TAB, comma-terminated transcript names) into argv1.evi.

use strict;
use File::Basename qw(basename);

my $AnnoFileName = $ARGV[0];
my $outputFileName = $ARGV[1];

if(!defined $AnnoFileName or !defined $outputFileName
   or $AnnoFileName eq "" or $outputFileName eq "")
{
    # A usage error is reported on STDERR with a non-zero exit status so that
    # a calling pipeline can tell it apart from a successful run.
    print STDERR "TXDBGEN: Please specify your input files\n";
    exit 1;
}

# File::Basename replaces the former `basename ...` backticks, which sent the
# file names through a shell without quoting.
my $cachefolder = basename($outputFileName).".cache";
my $AnnoFileBase = basename($AnnoFileName);

if(! -e $cachefolder)
{
    mkdir $cachefolder or die "CHECK: cannot mkdir $cachefolder: $!\n";
    print "TXDBGEN: mkdir $cachefolder\n";
}

my $CacheAnnoFileName = $cachefolder."/".$AnnoFileBase.".sort";

#sort the annotation file
print "TXDBGEN: sort $AnnoFileName \n";

# List-form system() bypasses the shell; "-o" replaces the ">" redirection and
# "--" protects against an input name that starts with a dash. A failed sort
# is fatal: continuing would silently process a missing or partial file.
system("sort", "-k6,6", "-k1,1", "-k2,2n", "-k3,3n",
       "-o", $CacheAnnoFileName, "--", $AnnoFileName) == 0
    or die "TXDBGEN: sort of $AnnoFileName failed (status $?)\n";

$AnnoFileName = $CacheAnnoFileName;

#read the annotations into hashes
open(my $AnnoFile, "<", $CacheAnnoFileName)
    or die "can not open $CacheAnnoFileName: $!\n";

#split the genes into contigs
my $contigid = 0;
my $end_tmp = 0;         # furthest transcript end seen in the current contig
my $chr_tmp = "chr";     # chromosome of the previous transcript
my $strand_tmp="NA";     # strand of the previous transcript

my %eventlist =();       # connection string -> number of exons in it (1..3)
my %evidences = ();      # connection string -> { transcript name -> 1 }

open(my $output, ">", $outputFileName)
    or die "can not open $outputFileName: $!\n";
open(my $output2, ">", "$outputFileName.evi")
    or die "can not open $outputFileName.evi: $!\n";

while(my $line = <$AnnoFile>)
{
    chomp($line);
    my @a = split("\t",$line);
    my $chr = $a[0];
    my $start = $a[1];
    my $end = $a[2];
    my $name = $a[3];
    my @sizes = split(",",$a[10]);
    my $strand = $a[5];
    my @start_shifts = split(",",$a[11]);

    # Absolute exon coordinates: column 12 holds offsets relative to the
    # transcript start, column 11 the matching exon sizes.
    my @starts;
    my @ends;
    for(my $i=0;$i<@start_shifts;$i++)
    {
        $starts[$i]=$start_shifts[$i]+$start;
        $ends[$i] = $starts[$i]+$sizes[$i];
    }

    if($start >$end_tmp or $chr ne $chr_tmp or $strand_tmp ne $strand)
    {
        # This transcript opens a new contig: emit everything collected for
        # the previous one (labelled with the previous chr/strand) first.
        $contigid++;
        _flush_contig(\%eventlist, \%evidences, $chr_tmp, $strand_tmp,
                      $output, $output2);
        print "TXDBGEN: Contig ID $contigid at $chr $strand...\n" if ( $contigid%1000 == 0);
    }

    $end_tmp = $end if ($end > $end_tmp or $chr ne $chr_tmp or $strand_tmp ne $strand);
    $chr_tmp = $chr;
    $strand_tmp = $strand;

    #scan connections, 2 and 3 exons for CA/CS/AF
    #didn't consider direction yet
    #add 1 exon for IR
    for(my $n=1;$n<4;$n++)
    {
        for(my $i=0;$i<scalar(@starts)-$n+1;$i++)
        {
            my $connectionstr = join("",
                map { $starts[$_]."-".$ends[$_]."," } $i .. $i+$n-1);
            $eventlist{$connectionstr} = $n;
            $evidences{$connectionstr}{$name} = 1;
        }
    }
}

# The last contig has no following transcript to trigger its flush.
_flush_contig(\%eventlist, \%evidences, $chr_tmp, $strand_tmp,
              $output, $output2);

close($AnnoFile);
# Buffered write errors only surface at close, so check both output handles.
close($output)  or die "can not close $outputFileName: $!\n";
close($output2) or die "can not close $outputFileName.evi: $!\n";

# _flush_contig(\%eventlist, \%evidences, $chr, $strand, $anno_fh, $evi_fh)
#
# Classifies the connections collected for one contig, prints the resulting
# annotations to $anno_fh, writes the supporting transcript names of every
# returned event id to $evi_fh, and finally empties both hashes.
#
# %evidences is emptied together with %eventlist: its keys contain coordinates
# only, so entries kept from an earlier contig could otherwise be reported as
# evidence for an unrelated event with identical coordinates on another
# chromosome or strand (and the hash would grow for the whole run).
sub _flush_contig
{
    my ($eventlist, $evidences, $chr, $strand, $anno_fh, $evi_fh) = @_;

    my $annos = scanevents($eventlist, "inner");

    # Plain if-block instead of "my $x = ... if COND", whose behaviour is
    # documented as undefined.
    my $eventids = {};
    if(%$annos)
    {
        # printanno() prints to the currently selected handle.
        my $previous = select($anno_fh);
        $eventids = printanno($annos, $chr, $strand);
        select($previous);
    }

    #print cross information
    foreach my $connect_str (keys %$eventids)
    {
        print {$evi_fh} $eventids->{$connect_str},"\t";
        foreach my $transcriptid (keys %{$evidences->{$connect_str}})
        {
            print {$evi_fh} $transcriptid,",";
        }
        print {$evi_fh} "\n";
    }

    %$eventlist = ();
    %$evidences = ();
    return;
}
37a16ff93dd9 planemo upload
bioitcore
parents:
diff changeset
173
37a16ff93dd9 planemo upload
bioitcore
parents:
diff changeset
174 #close(CacheContigFile);
37a16ff93dd9 planemo upload
bioitcore
parents:
diff changeset
175 #define sub scanevents
37a16ff93dd9 planemo upload
bioitcore
parents:
diff changeset
# scanevents(\%eventlist, $mode)
#
# Classifies the connection strings of one contig and returns a reference to
# a hash mapping connection string -> event label.
#
# $mode "inner": %eventlist maps "start-end,start-end,...," to its exon count.
#   * three-exon connection: "ca" when the connection made of its first and
#     third exon is also present, otherwise "cs";
#   * two-exon connection: "ir" when a single exon running from the first
#     start to the second end is present;
#   * two two-exon connections with identical outer boundaries that differ in
#     exactly one inner boundary add a new three-segment key labelled "ss",
#     with the differing stretch as the middle segment.
# $mode "af" / "al" (alternative first/last exon): every pair of distinct
#   keys is joined as "x|y", the key with the strictly smaller hash value
#   first. The pair is labelled with $mode when the first comma-separated
#   fields differ and the second are equal ("af"), or the first are equal and
#   the second differ ("al").
# Any other mode yields an empty hash.
sub scanevents
{
    my ($eventlist, $mode) = @_;
    my %anno;

    if ($mode eq "inner")
    {
        my @connections = keys %$eventlist;
        # Only two-exon connections can take part in the "ss" comparison.
        my @two_exon = grep { !($eventlist->{$_} != 2) } @connections;

        foreach my $conn (@connections)
        {
            my $exon_count = $eventlist->{$conn};

            if ($exon_count == 3)
            {
                my @exons   = split(",", $conn);
                my $skipped = join(",", $exons[0], $exons[2]) . ",";
                $anno{$conn} = exists $eventlist->{$skipped} ? "ca" : "cs";
                next;
            }
            next unless $exon_count == 2;

            my ($s1, $e1, $s2, $e2) = split(/[,-]/, $conn);

            # One exon covering both exons and the gap between them.
            $anno{$conn} = "ir" if exists $eventlist->{"$s1-$e2,"};

            foreach my $other (@two_exon)
            {
                my ($os1, $oe1, $os2, $oe2) = split(/[,-]/, $other);
                next unless $s1 == $os1 && $e2 == $oe2;

                if ($e1 == $oe1)
                {
                    # Same first exon: the second exon starts differ.
                    next if $os2 == $s2;
                    my ($near, $far) = $os2 > $s2 ? ($s2, $os2) : ($os2, $s2);
                    $anno{"$s1-$e1,$near-$far,$far-$e2,"} = "ss";
                }
                elsif ($s2 == $os2)
                {
                    # Same second exon: the first exon ends differ.
                    my ($near, $far) = $oe1 > $e1 ? ($e1, $oe1) : ($oe1, $e1);
                    $anno{"$s1-$near,$near-$far,$s2-$e2,"} = "ss";
                }
            }
        }
    }
    elsif ($mode eq "af" or $mode eq "al")
    {
        my $first_mode = $mode eq "af";

        foreach my $conn (keys %$eventlist)
        {
            my @mine = split(/,/, $conn);

            foreach my $other (keys %$eventlist)
            {
                next if $other eq $conn;

                my $pair = $eventlist->{$other} < $eventlist->{$conn}
                         ? "$other|$conn"
                         : "$conn|$other";
                next if exists $anno{$pair};

                my @theirs      = split(/,/, $other);
                my $same_first  = $mine[0] eq $theirs[0];
                my $same_second = $mine[1] eq $theirs[1];

                my $matches = $first_mode
                            ? (!$same_first && $same_second)
                            : ($same_first && !$same_second);
                $anno{$pair} = $mode if $matches;
            }
        }
    }

    return \%anno;
}
37a16ff93dd9 planemo upload
bioitcore
parents:
diff changeset
294
37a16ff93dd9 planemo upload
bioitcore
parents:
diff changeset
295
37a16ff93dd9 planemo upload
bioitcore
parents:
diff changeset
296 sub printanno
37a16ff93dd9 planemo upload
bioitcore
parents:
diff changeset
297 {
37a16ff93dd9 planemo upload
bioitcore
parents:
diff changeset
298 # print the annotations
37a16ff93dd9 planemo upload
bioitcore
parents:
diff changeset
299 # and return the connectstr and event id to be used to print evidences
37a16ff93dd9 planemo upload
bioitcore
parents:
diff changeset
300 my %eventids=();
37a16ff93dd9 planemo upload
bioitcore
parents:
diff changeset
301 my ($annos,$chr,$strand)=@_;
37a16ff93dd9 planemo upload
bioitcore
parents:
diff changeset
302 my %nums_per_isoform;
37a16ff93dd9 planemo upload
bioitcore
parents:
diff changeset
303 foreach my $key (keys %$annos)
37a16ff93dd9 planemo upload
bioitcore
parents:
diff changeset
304 {
37a16ff93dd9 planemo upload
bioitcore
parents:
diff changeset
305 if($annos->{$key} eq "af")
37a16ff93dd9 planemo upload
bioitcore
parents:
diff changeset
306 {
37a16ff93dd9 planemo upload
bioitcore
parents:
diff changeset
307 my @a=split(/[\,\-\|]+/,$key);
37a16ff93dd9 planemo upload
bioitcore
parents:
diff changeset
308 my $chrid=substr($chr,3,length($chr)-3);
37a16ff93dd9 planemo upload
bioitcore
parents:
diff changeset
309 my $id_anno="AF";
37a16ff93dd9 planemo upload
bioitcore
parents:
diff changeset
310 #consider direction later
37a16ff93dd9 planemo upload
bioitcore
parents:
diff changeset
311 my $id=join("-",$id_anno,$id_anno, $a[2],$a[3]);
37a16ff93dd9 planemo upload
bioitcore
parents:
diff changeset
312 my $num=0;
37a16ff93dd9 planemo upload
bioitcore
parents:
diff changeset
313 $num = $nums_per_isoform{$id} if exists $nums_per_isoform{$id};
37a16ff93dd9 planemo upload
bioitcore
parents:
diff changeset
314 $nums_per_isoform{$id}++;
37a16ff93dd9 planemo upload
bioitcore
parents:
diff changeset
315
37a16ff93dd9 planemo upload
bioitcore
parents:
diff changeset
316 print $chr,"\t",$a[0],"\t",$a[3],"\t";
37a16ff93dd9 planemo upload
bioitcore
parents:
diff changeset
317 print $id.".".$num,"[L]\t";
37a16ff93dd9 planemo upload
bioitcore
parents:
diff changeset
318 print "0\t";
37a16ff93dd9 planemo upload
bioitcore
parents:
diff changeset
319 print $strand,"\t";
37a16ff93dd9 planemo upload
bioitcore
parents:
diff changeset
320 print $a[0],"\t",$a[3],"\t";
37a16ff93dd9 planemo upload
bioitcore
parents:
diff changeset
321 print "255,0,0\t";
37a16ff93dd9 planemo upload
bioitcore
parents:
diff changeset
322 print "2\t";
37a16ff93dd9 planemo upload
bioitcore
parents:
diff changeset
323 print $a[1]-$a[0],",";
37a16ff93dd9 planemo upload
bioitcore
parents:
diff changeset
324 print $a[3]-$a[2],"\t";
37a16ff93dd9 planemo upload
bioitcore
parents:
diff changeset
325 print "0,";
37a16ff93dd9 planemo upload
bioitcore
parents:
diff changeset
326 print $a[2]-$a[0],"\n";
37a16ff93dd9 planemo upload
bioitcore
parents:
diff changeset
327
37a16ff93dd9 planemo upload
bioitcore
parents:
diff changeset
328 print $chr,"\t",$a[4],"\t",$a[7],"\t";
37a16ff93dd9 planemo upload
bioitcore
parents:
diff changeset
329 print $id.".".$num,"[R]\t";
37a16ff93dd9 planemo upload
bioitcore
parents:
diff changeset
330 print "0\t";
37a16ff93dd9 planemo upload
bioitcore
parents:
diff changeset
331 print $strand,"\t";
37a16ff93dd9 planemo upload
bioitcore
parents:
diff changeset
332 print $a[4],"\t",$a[7],"\t";
37a16ff93dd9 planemo upload
bioitcore
parents:
diff changeset
333 print "255,0,0\t";
37a16ff93dd9 planemo upload
bioitcore
parents:
diff changeset
334 print "2\t";
37a16ff93dd9 planemo upload
bioitcore
parents:
diff changeset
335 print $a[5]-$a[4],",";
37a16ff93dd9 planemo upload
bioitcore
parents:
diff changeset
336 print $a[7]-$a[6],"\t";
37a16ff93dd9 planemo upload
bioitcore
parents:
diff changeset
337 print "0,";
37a16ff93dd9 planemo upload
bioitcore
parents:
diff changeset
338 print $a[6]-$a[4],"\n";
37a16ff93dd9 planemo upload
bioitcore
parents:
diff changeset
339
37a16ff93dd9 planemo upload
bioitcore
parents:
diff changeset
340 #print "$key,af\n";
37a16ff93dd9 planemo upload
bioitcore
parents:
diff changeset
341 }
37a16ff93dd9 planemo upload
bioitcore
parents:
diff changeset
342 if($annos->{$key} eq "ca" or $annos->{$key} eq "cs")
37a16ff93dd9 planemo upload
bioitcore
parents:
diff changeset
343 {
37a16ff93dd9 planemo upload
bioitcore
parents:
diff changeset
344 my @a=split(/[,-]/,$key);
37a16ff93dd9 planemo upload
bioitcore
parents:
diff changeset
345
37a16ff93dd9 planemo upload
bioitcore
parents:
diff changeset
346 my $chrid=substr($chr,3,length($chr)-3);
37a16ff93dd9 planemo upload
bioitcore
parents:
diff changeset
347 my $id_anno="CS";
37a16ff93dd9 planemo upload
bioitcore
parents:
diff changeset
348 $id_anno="CA" if $annos->{$key} eq "ca";
37a16ff93dd9 planemo upload
bioitcore
parents:
diff changeset
349 my $id="CA-$id_anno-$chrid"."-".$a[2]."-".$a[3];
37a16ff93dd9 planemo upload
bioitcore
parents:
diff changeset
350 my $num=0;
37a16ff93dd9 planemo upload
bioitcore
parents:
diff changeset
351 $num = $nums_per_isoform{$id} if exists $nums_per_isoform{$id};
37a16ff93dd9 planemo upload
bioitcore
parents:
diff changeset
352 $nums_per_isoform{$id}++;
37a16ff93dd9 planemo upload
bioitcore
parents:
diff changeset
353
37a16ff93dd9 planemo upload
bioitcore
parents:
diff changeset
354 print $chr,"\t",$a[0],"\t",$a[5],"\t";
37a16ff93dd9 planemo upload
bioitcore
parents:
diff changeset
355 print $id.".".$num,"[L]\t";
37a16ff93dd9 planemo upload
bioitcore
parents:
diff changeset
356 $eventids {$key} = $id.".".$num."[L]";
37a16ff93dd9 planemo upload
bioitcore
parents:
diff changeset
357 print "0\t";
37a16ff93dd9 planemo upload
bioitcore
parents:
diff changeset
358 print $strand,"\t";
37a16ff93dd9 planemo upload
bioitcore
parents:
diff changeset
359 print $a[0],"\t",$a[5],"\t";
37a16ff93dd9 planemo upload
bioitcore
parents:
diff changeset
360 print "255,0,0\t";
37a16ff93dd9 planemo upload
bioitcore
parents:
diff changeset
361 print "3\t";
37a16ff93dd9 planemo upload
bioitcore
parents:
diff changeset
362 print $a[1]-$a[0],",";
37a16ff93dd9 planemo upload
bioitcore
parents:
diff changeset
363 print $a[3]-$a[2],",";
37a16ff93dd9 planemo upload
bioitcore
parents:
diff changeset
364 print $a[5]-$a[4],"\t";
37a16ff93dd9 planemo upload
bioitcore
parents:
diff changeset
365 print "0,";
37a16ff93dd9 planemo upload
bioitcore
parents:
diff changeset
366 print $a[2]-$a[0],",";
37a16ff93dd9 planemo upload
bioitcore
parents:
diff changeset
367 print $a[4]-$a[0],"\n";
37a16ff93dd9 planemo upload
bioitcore
parents:
diff changeset
368
37a16ff93dd9 planemo upload
bioitcore
parents:
diff changeset
369 print $chr,"\t",$a[0],"\t",$a[5],"\t";
37a16ff93dd9 planemo upload
bioitcore
parents:
diff changeset
370 print $id.".".$num,"[S]\t";
37a16ff93dd9 planemo upload
bioitcore
parents:
diff changeset
371 my $connectstr_ca= $a[0]."-".$a[1].",".$a[4]."-".$a[5].",";
37a16ff93dd9 planemo upload
bioitcore
parents:
diff changeset
372 $eventids{$connectstr_ca} = $id.".".$num."[S]";
37a16ff93dd9 planemo upload
bioitcore
parents:
diff changeset
373 print "0\t";
37a16ff93dd9 planemo upload
bioitcore
parents:
diff changeset
374 print $strand,"\t";
37a16ff93dd9 planemo upload
bioitcore
parents:
diff changeset
375 print $a[0],"\t",$a[5],"\t";
37a16ff93dd9 planemo upload
bioitcore
parents:
diff changeset
376 print "255,0,0\t";
37a16ff93dd9 planemo upload
bioitcore
parents:
diff changeset
377 print "2\t";
37a16ff93dd9 planemo upload
bioitcore
parents:
diff changeset
378 print $a[1]-$a[0],",";
37a16ff93dd9 planemo upload
bioitcore
parents:
diff changeset
379 #print $a[3]-$a[2],",";
37a16ff93dd9 planemo upload
bioitcore
parents:
diff changeset
380 print $a[5]-$a[4],"\t";
37a16ff93dd9 planemo upload
bioitcore
parents:
diff changeset
381 print "0,";
37a16ff93dd9 planemo upload
bioitcore
parents:
diff changeset
382 #print $a[2]-$a[0],",";
37a16ff93dd9 planemo upload
bioitcore
parents:
diff changeset
383 print $a[4]-$a[0],"\n";
37a16ff93dd9 planemo upload
bioitcore
parents:
diff changeset
384
37a16ff93dd9 planemo upload
bioitcore
parents:
diff changeset
385 }
37a16ff93dd9 planemo upload
bioitcore
parents:
diff changeset
386 if($annos->{$key} eq "ir")
37a16ff93dd9 planemo upload
bioitcore
parents:
diff changeset
387 {
37a16ff93dd9 planemo upload
bioitcore
parents:
diff changeset
388 my @a=split(/[,-]/,$key);
37a16ff93dd9 planemo upload
bioitcore
parents:
diff changeset
389
37a16ff93dd9 planemo upload
bioitcore
parents:
diff changeset
390 my $chrid=substr($chr,3,length($chr)-3);
37a16ff93dd9 planemo upload
bioitcore
parents:
diff changeset
391 my $id="IR-IR-$chrid"."-".$a[1]."-".$a[2];
37a16ff93dd9 planemo upload
bioitcore
parents:
diff changeset
392 my $num=0;
37a16ff93dd9 planemo upload
bioitcore
parents:
diff changeset
393 $num = $nums_per_isoform{$id} if exists $nums_per_isoform{$id};
37a16ff93dd9 planemo upload
bioitcore
parents:
diff changeset
394 $nums_per_isoform{$id}++;
37a16ff93dd9 planemo upload
bioitcore
parents:
diff changeset
395
37a16ff93dd9 planemo upload
bioitcore
parents:
diff changeset
396 print $chr,"\t",$a[0],"\t",$a[3],"\t";
37a16ff93dd9 planemo upload
bioitcore
parents:
diff changeset
397 print $id.".".$num,"[L]\t";
37a16ff93dd9 planemo upload
bioitcore
parents:
diff changeset
398 print "0\t";
37a16ff93dd9 planemo upload
bioitcore
parents:
diff changeset
399 print $strand,"\t";
37a16ff93dd9 planemo upload
bioitcore
parents:
diff changeset
400 print $a[0],"\t",$a[3],"\t";
37a16ff93dd9 planemo upload
bioitcore
parents:
diff changeset
401 $eventids{$a[0]."-".$a[3].","} = $id.".".$num."[L]";
37a16ff93dd9 planemo upload
bioitcore
parents:
diff changeset
402 print "255,0,0\t";
37a16ff93dd9 planemo upload
bioitcore
parents:
diff changeset
403 print "3\t";
37a16ff93dd9 planemo upload
bioitcore
parents:
diff changeset
404 print $a[1]-$a[0],",";
37a16ff93dd9 planemo upload
bioitcore
parents:
diff changeset
405 print $a[2]-$a[1],",";
37a16ff93dd9 planemo upload
bioitcore
parents:
diff changeset
406 print $a[3]-$a[2],"\t";
37a16ff93dd9 planemo upload
bioitcore
parents:
diff changeset
407 print "0,";
37a16ff93dd9 planemo upload
bioitcore
parents:
diff changeset
408 print $a[1]-$a[0],",";
37a16ff93dd9 planemo upload
bioitcore
parents:
diff changeset
409 print $a[2]-$a[0],"\n";
37a16ff93dd9 planemo upload
bioitcore
parents:
diff changeset
410
37a16ff93dd9 planemo upload
bioitcore
parents:
diff changeset
411 print $chr,"\t",$a[0],"\t",$a[3],"\t";
37a16ff93dd9 planemo upload
bioitcore
parents:
diff changeset
412 print $id.".".$num,"[S]\t";
37a16ff93dd9 planemo upload
bioitcore
parents:
diff changeset
413 $eventids{$key} = $id.".".$num."[S]";
37a16ff93dd9 planemo upload
bioitcore
parents:
diff changeset
414 print "0\t";
37a16ff93dd9 planemo upload
bioitcore
parents:
diff changeset
415 print $strand,"\t";
37a16ff93dd9 planemo upload
bioitcore
parents:
diff changeset
416 print $a[0],"\t",$a[3],"\t";
37a16ff93dd9 planemo upload
bioitcore
parents:
diff changeset
417 print "255,0,0\t";
37a16ff93dd9 planemo upload
bioitcore
parents:
diff changeset
418 print "2\t";
37a16ff93dd9 planemo upload
bioitcore
parents:
diff changeset
419 print $a[1]-$a[0],",";
37a16ff93dd9 planemo upload
bioitcore
parents:
diff changeset
420 #print $a[3]-$a[2],",";
37a16ff93dd9 planemo upload
bioitcore
parents:
diff changeset
421 print $a[3]-$a[2],"\t";
37a16ff93dd9 planemo upload
bioitcore
parents:
diff changeset
422 print "0,";
37a16ff93dd9 planemo upload
bioitcore
parents:
diff changeset
423 #print $a[2]-$a[0],",";
37a16ff93dd9 planemo upload
bioitcore
parents:
diff changeset
424 print $a[2]-$a[0],"\n";
37a16ff93dd9 planemo upload
bioitcore
parents:
diff changeset
425
37a16ff93dd9 planemo upload
bioitcore
parents:
diff changeset
426 }
37a16ff93dd9 planemo upload
bioitcore
parents:
diff changeset
427 if($annos->{$key} eq "ss")
37a16ff93dd9 planemo upload
bioitcore
parents:
diff changeset
428 {
37a16ff93dd9 planemo upload
bioitcore
parents:
diff changeset
429 my @a=split(/[,-]/,$key);
37a16ff93dd9 planemo upload
bioitcore
parents:
diff changeset
430 my $chrid=substr($chr,3,length($chr)-3);
37a16ff93dd9 planemo upload
bioitcore
parents:
diff changeset
431 my $type="AA";
37a16ff93dd9 planemo upload
bioitcore
parents:
diff changeset
432 if( ($strand eq "+" && $a[1]==$a[2]) or ($strand eq "-" && $a[3]==$a[4]))
37a16ff93dd9 planemo upload
bioitcore
parents:
diff changeset
433 {
37a16ff93dd9 planemo upload
bioitcore
parents:
diff changeset
434 $type="AD";
37a16ff93dd9 planemo upload
bioitcore
parents:
diff changeset
435 }
37a16ff93dd9 planemo upload
bioitcore
parents:
diff changeset
436 my $id="$type-$type-$chrid"."-".$a[2]."-".$a[3];
37a16ff93dd9 planemo upload
bioitcore
parents:
diff changeset
437 my $connect_str_L = "";
37a16ff93dd9 planemo upload
bioitcore
parents:
diff changeset
438 my $connect_str_S = "";
37a16ff93dd9 planemo upload
bioitcore
parents:
diff changeset
439 if($a[1]==$a[2])
37a16ff93dd9 planemo upload
bioitcore
parents:
diff changeset
440 {
37a16ff93dd9 planemo upload
bioitcore
parents:
diff changeset
441 $connect_str_L = $a[0]."-".$a[3].",".$a[4]."-".$a[5].",";
37a16ff93dd9 planemo upload
bioitcore
parents:
diff changeset
442 $connect_str_S = $a[0]."-".$a[1].",".$a[4]."-".$a[5].",";
37a16ff93dd9 planemo upload
bioitcore
parents:
diff changeset
443 }
37a16ff93dd9 planemo upload
bioitcore
parents:
diff changeset
444 else
37a16ff93dd9 planemo upload
bioitcore
parents:
diff changeset
445 {
37a16ff93dd9 planemo upload
bioitcore
parents:
diff changeset
446 $connect_str_L = $a[0]."-".$a[1].",".$a[2]."-".$a[5].",";
37a16ff93dd9 planemo upload
bioitcore
parents:
diff changeset
447 $connect_str_S = $a[0]."-".$a[1].",".$a[3]."-".$a[5].",";
37a16ff93dd9 planemo upload
bioitcore
parents:
diff changeset
448
37a16ff93dd9 planemo upload
bioitcore
parents:
diff changeset
449 }
37a16ff93dd9 planemo upload
bioitcore
parents:
diff changeset
450 my $num=0;
37a16ff93dd9 planemo upload
bioitcore
parents:
diff changeset
451 $num = $nums_per_isoform{$id} if exists $nums_per_isoform{$id};
37a16ff93dd9 planemo upload
bioitcore
parents:
diff changeset
452 $nums_per_isoform{$id}++;
37a16ff93dd9 planemo upload
bioitcore
parents:
diff changeset
453 print $chr,"\t",$a[0],"\t",$a[5],"\t";
37a16ff93dd9 planemo upload
bioitcore
parents:
diff changeset
454 print $id.".".$num,"[L]\t";
37a16ff93dd9 planemo upload
bioitcore
parents:
diff changeset
455 $eventids {$connect_str_L} = $id.".".$num."[L]";
37a16ff93dd9 planemo upload
bioitcore
parents:
diff changeset
456 print "0\t";
37a16ff93dd9 planemo upload
bioitcore
parents:
diff changeset
457 print $strand,"\t";
37a16ff93dd9 planemo upload
bioitcore
parents:
diff changeset
458 print $a[0],"\t",$a[5],"\t";
37a16ff93dd9 planemo upload
bioitcore
parents:
diff changeset
459 print "255,0,0\t";
37a16ff93dd9 planemo upload
bioitcore
parents:
diff changeset
460 print "3\t";
37a16ff93dd9 planemo upload
bioitcore
parents:
diff changeset
461 print $a[1]-$a[0],",";
37a16ff93dd9 planemo upload
bioitcore
parents:
diff changeset
462 print $a[3]-$a[2],",";
37a16ff93dd9 planemo upload
bioitcore
parents:
diff changeset
463 print $a[5]-$a[4],"\t";
37a16ff93dd9 planemo upload
bioitcore
parents:
diff changeset
464 print "0,";
37a16ff93dd9 planemo upload
bioitcore
parents:
diff changeset
465 print $a[2]-$a[0],",";
37a16ff93dd9 planemo upload
bioitcore
parents:
diff changeset
466 print $a[4]-$a[0],"\n";
37a16ff93dd9 planemo upload
bioitcore
parents:
diff changeset
467
37a16ff93dd9 planemo upload
bioitcore
parents:
diff changeset
468 print $chr,"\t",$a[0],"\t",$a[5],"\t";
37a16ff93dd9 planemo upload
bioitcore
parents:
diff changeset
469 print $id.".".$num,"[S]\t";
37a16ff93dd9 planemo upload
bioitcore
parents:
diff changeset
470 $eventids {$connect_str_S} = $id.".".$num."[S]";
37a16ff93dd9 planemo upload
bioitcore
parents:
diff changeset
471 print "0\t";
37a16ff93dd9 planemo upload
bioitcore
parents:
diff changeset
472 print $strand,"\t";
37a16ff93dd9 planemo upload
bioitcore
parents:
diff changeset
473 print $a[0],"\t",$a[5],"\t";
37a16ff93dd9 planemo upload
bioitcore
parents:
diff changeset
474 print "255,0,0\t";
37a16ff93dd9 planemo upload
bioitcore
parents:
diff changeset
475 print "2\t";
37a16ff93dd9 planemo upload
bioitcore
parents:
diff changeset
476 print $a[1]-$a[0],",";
37a16ff93dd9 planemo upload
bioitcore
parents:
diff changeset
477 #print $a[3]-$a[2],",";
37a16ff93dd9 planemo upload
bioitcore
parents:
diff changeset
478 print $a[5]-$a[4],"\t";
37a16ff93dd9 planemo upload
bioitcore
parents:
diff changeset
479 print "0,";
37a16ff93dd9 planemo upload
bioitcore
parents:
diff changeset
480 #print $a[2]-$a[0],",";
37a16ff93dd9 planemo upload
bioitcore
parents:
diff changeset
481 print $a[4]-$a[0],"\n";
37a16ff93dd9 planemo upload
bioitcore
parents:
diff changeset
482
37a16ff93dd9 planemo upload
bioitcore
parents:
diff changeset
483
37a16ff93dd9 planemo upload
bioitcore
parents:
diff changeset
484 }
37a16ff93dd9 planemo upload
bioitcore
parents:
diff changeset
485
37a16ff93dd9 planemo upload
bioitcore
parents:
diff changeset
486 }
37a16ff93dd9 planemo upload
bioitcore
parents:
diff changeset
487 return(\%eventids);
37a16ff93dd9 planemo upload
bioitcore
parents:
diff changeset
488
37a16ff93dd9 planemo upload
bioitcore
parents:
diff changeset
489 }
37a16ff93dd9 planemo upload
bioitcore
parents:
diff changeset
490