annotate cpt_psm_recombine/lib/CPT/Bio.pm @ 0:b18e8268bf4e draft

Uploaded
author cpt
date Tue, 05 Jul 2022 05:05:13 +0000
parents
children
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
0
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
1 package CPT::Bio;
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
2 use Moose;
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
3 use strict;
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
4 use warnings;
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
5 use autodie;
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
6 use CPT::FiletypeDetector;
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
7 use CPT::BioData;
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
8 my $bd = CPT::BioData->new();
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
9
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
10 my $filetype = CPT::FiletypeDetector->new();
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
11
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
12 has 'var_translate' => ( is => 'rw', isa => 'Bool');
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
13 has 'var_header' => ( is => 'rw', isa => 'Bool');
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
14 has codonTable => (
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
15 is => 'rw',
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
16 isa => 'Any',
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
17 default => sub {
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
18 $bd->getTranslationTable(11)
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
19 },
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
20 );
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
21
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
22 sub set_codon_table {
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
23 my ($self, $num) = @_;
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
24 $self->codonTable($bd->getTranslationTable($num));
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
25 }
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
26
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
27
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
28 sub _getFeatureTag {
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
29 my ( $self, $feat, $tag ) = @_;
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
30 if(! defined($feat)){
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
31 warn "Undefined feature";
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
32 }
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
33 return $feat->has_tag($tag)
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
34 ? ( join( ',', $feat->get_tag_values($tag) ) )
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
35 : '';
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
36 }
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
37
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
38 sub _getIdentifier {
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
39 my ( $self, $feat ) = @_;
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
40 my $line;
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
41 if ( ref $feat eq 'Bio::Seq::RichSeq' || ref $feat eq 'Bio::Seq' ) {
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
42 return $feat->display_id;
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
43 }
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
44 else {
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
45 my $locus_tag = $self->_getFeatureTag( $feat, 'locus_tag' );
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
46 if ($locus_tag) {
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
47 return $locus_tag;
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
48 }
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
49 my $gene = $self->_getFeatureTag( $feat, 'gene' );
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
50 if ($gene) {
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
51 return $gene;
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
52 }
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
53 my $product = $self->_getFeatureTag( $feat, 'product' );
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
54 if ($product) {
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
55 return $product;
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
56 }
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
57 }
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
58 return sprintf("%s_%s_%s", $feat->start(), $feat->end(), ($feat->strand() == 1 ? 'sense':'antisense'));
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
59 }
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
60
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
61
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
62 sub requestCopy {
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
63 my ( $self, %data ) = @_;
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
64 use Bio::SeqIO;
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
65 if ($data{'file'} ) {
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
66 my ($guessed_type) = $filetype->detect( $data{'file'} );
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
67 my $seqio = Bio::SeqIO->new(
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
68 -file => $data{'file'},
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
69 -format => $guessed_type
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
70 );
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
71 my @results;
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
72 while ( my $seqobj = $seqio->next_seq() ) {
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
73 return \$seqobj;
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
74 }
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
75 }
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
76 else {
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
77 die "No file specified";
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
78 }
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
79 }
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
80
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
81
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
82 sub getSeqIO {
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
83 my ( $self, $file ) = @_;
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
84 use Bio::SeqIO;
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
85 if ($file ) {
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
86 my ($guessed_type) = $filetype->detect( $file );
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
87 my $seqio = Bio::SeqIO->new(
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
88 -file => $file,
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
89 -format => $guessed_type
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
90 );
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
91 return $seqio;
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
92 }
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
93 else {
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
94 die "No file specified";
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
95 }
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
96 }
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
97
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
98
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
99 sub parseFile {
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
100 my ( $self, %data ) = @_;
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
101 use Bio::SeqIO;
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
102
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
103 my ($guessed_type) = $filetype->detect( $data{'file'} );
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
104 my $seqio = Bio::SeqIO->new(
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
105 -file => $data{'file'},
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
106 -format => $guessed_type
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
107 );
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
108
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
109 # Are we to translate this
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
110 $self->var_translate(defined($data{translate}) && $data{translate});
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
111 $self->var_header(defined($data{header}) && $data{header});
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
112
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
113 my @results;
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
114 if ( not defined $data{'subset'} ) {
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
115 $data{'subset'} = 'all';
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
116 }
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
117 while ( my $seqobj = $seqio->next_seq() ) {
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
118 if (
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
119 (ref $data{'subset'} ne 'ARRAY'
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
120 && $data{'subset'} eq 'whole' ) # Want the whole thing for a richseq
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
121 ||
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
122 (ref $seqobj eq 'Bio::Seq' || ref $seqobj eq 'Bio::Seq::fasta')
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
123 # or it's a fasta type sequence
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
124 )
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
125 {
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
126 push( @results, $self->handle_seq($seqobj));
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
127 }
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
128 else #data subset eq sometag
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
129 {
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
130 my %wanted_tags;
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
131 if ( ref $data{'subset'} eq 'ARRAY' ) {
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
132 %wanted_tags =
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
133 map { $_ => 1 } @{ $data{'subset'} };
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
134 }
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
135 else {
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
136 $wanted_tags{ $data{'subset'} }++;
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
137 }
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
138 foreach my $feat ( $seqobj->get_SeqFeatures ) {
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
139 if (
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
140 $wanted_tags{ $feat->primary_tag }
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
141 || ( $wanted_tags{'all'}
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
142 && $feat->primary_tag ne
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
143 "source" )
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
144 )
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
145 {
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
146 push( @results, $self->handle_seq($feat));
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
147 }
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
148 }
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
149 }
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
150 }
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
151 if ( $data{'callback'} ) {
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
152 $data{'callback'}->( \@results );
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
153 }
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
154 else {
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
155 return \@results;
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
156 }
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
157 }
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
158
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
159 sub handle_seq {
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
160 my ($self, $obj) = @_;
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
161
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
162 my @line;
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
163 if ( $self->var_header() ){
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
164 $line[0] = '>' . $self->_getIdentifier($obj);
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
165 }
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
166
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
167 # Get our sequence
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
168 $line[1] = $self->intelligent_get_seq($obj);
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
169
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
170 if ( $self->var_translate() ) {
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
171 $line[1] = $self->translate($line[1]);
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
172 }
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
173 return \@line;
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
174 }
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
175
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
176 sub intelligent_get_seq {
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
177 my ($self, $obj, %extra) = @_;
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
178 # Top level, e.g., fasta/gbk file, "extra" doesn't apply to these
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
179 if ( ref $obj eq 'Bio::Seq::RichSeq' || ref $obj eq 'Bio::Seq' ) {
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
180 return $obj->seq;
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
181 }else{
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
182 return $self->get_seq_from_feature($obj, %extra);
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
183 }
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
184 }
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
185 sub get_seq_from_feature {
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
186 my ($self, $feat, %extra) = @_;
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
187 my $seq;
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
188 my $l;
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
189 if($extra{parent}){
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
190 $l = $extra{parent}->length();
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
191 }
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
192
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
193 if($extra{upstream}){
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
194 if($feat->strand < 0){
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
195 my $y = $feat->end + 1;
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
196 my $z = $feat->end + $extra{upstream};
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
197 if($y < $l){
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
198 if($z > $l){
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
199 $z = $l;
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
200 }
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
201 $seq .= $extra{parent}->trunc($y, $z)->revcom->seq;
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
202 }
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
203 }else{
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
204 my $y = $feat->start - $extra{upstream};
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
205 my $z = $feat->start - 1;
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
206 if($z > 0){
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
207 if($y < 1){
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
208 $y = 1;
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
209 }
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
210 $seq .= $extra{parent}->trunc($y, $z)->seq;
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
211 }
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
212 }
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
213 }
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
214 if(ref($feat->location) eq 'Bio::Location::Simple'){
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
215 $seq .= $feat->seq->seq();
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
216 }else{
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
217 $seq .= $feat->spliced_seq->seq();
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
218 }
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
219 if($extra{downstream}){
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
220 if($feat->strand < 0){
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
221 my $y = $feat->start - $extra{downstream};
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
222 my $z = $feat->start - 1;
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
223 if($z > 0){
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
224 if($y < 1){
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
225 $y = 1;
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
226 }
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
227 $seq .= $extra{parent}->trunc($y, $z)->revcom->seq;
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
228 }
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
229 }else{
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
230 my $y = $feat->end + 1;
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
231 my $z = $feat->end + $extra{downstream};
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
232 if($y < $l){
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
233 if($z > $l){
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
234 $z = $l;
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
235 }
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
236 $seq .= $extra{parent}->trunc($y, $z)->seq;
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
237 }
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
238 }
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
239 }
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
240
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
241 return $seq;
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
242 }
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
243
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
244
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
245 sub translate {
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
246 my ($self, $seq) = @_;
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
247 if($seq =~ /^[ACTGN]+$/){
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
248 my %ct = %{$self->codonTable};
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
249 $seq = join( '' , map { if($ct{$_}){ $ct{$_} }else{ () } } unpack("(A3)*", $seq));
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
250 }
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
251 return $seq;
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
252 }
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
253
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
254 no Moose;
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
255 1;
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
256
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
257 __END__
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
258
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
259 =pod
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
260
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
261 =encoding UTF-8
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
262
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
263 =head1 NAME
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
264
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
265 CPT::Bio
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
266
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
267 =head1 VERSION
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
268
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
269 version 1.99.4
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
270
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
271 =head2 _getFeatureTag
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
272
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
273 my $tag = $libCPT->_getFeatureTag($feature,'note');
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
274
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
275 returns all values of the given tag, joined with ','.
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
276
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
277 =head2 requestCopy
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
278
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
279 my $seqobj = $libCPT->requestCopy('file'=>'test.gbk');
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
280
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
281 requests a 'copy' of a given Bio::SeqIO file, which allows for addition of features before writing out to file.
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
282
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
283 =head2 getSeqIO
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
284
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
285 my $seqio = $libCPT->getSeqIO('file'=>'test.gbk');
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
286
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
287 requests a 'copy' of a given Bio::SeqIO file, which allows for addition of features before writing out to file.
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
288
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
289 =head2 parseFile
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
290
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
291 $libCPT->parseFile(
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
292 'file' => $options{'file'},
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
293 'callback' => \&func,
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
294 'translate' => 1,
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
295 'header' => 1,
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
296 'subset' => ['CDS', $options{'tag'}],
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
297 );
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
298
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
299 Arguably the most important function in this library, wraps a lot of functionality in a clean wrapper, since most of the scripts we have are written around data munging.
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
300
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
301 =over 4
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
302
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
303 =item *
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
304
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
305 file - the Bio::SeqIO file to process
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
306
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
307 =item *
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
308
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
309 callback - the function to send our data to. Done all at once, in an array
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
310
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
311 =item *
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
312
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
313 translate - should we translate the sequence to amino acids if it's not already.
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
314
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
315 =item *
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
316
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
317 subset - either "whole", a valid tag, or an array of valid tags
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
318
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
319 =item *
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
320
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
321 header - Do we want a header (FASTA) with our result set
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
322
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
323 =back
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
324
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
325 =head1 AUTHOR
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
326
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
327 Eric Rasche <rasche.eric@yandex.ru>
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
328
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
329 =head1 COPYRIGHT AND LICENSE
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
330
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
331 This software is Copyright (c) 2014 by Eric Rasche.
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
332
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
333 This is free software, licensed under:
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
334
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
335 The GNU General Public License, Version 3, June 2007
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
336
b18e8268bf4e Uploaded
cpt
parents:
diff changeset
337 =cut