annotate Roary/lib/Bio/Roary/CommandLine/RoaryPostAnalysis.pm @ 0:c47a5f61bc9f draft

Uploaded
author dereeper
date Fri, 14 May 2021 20:27:06 +0000
parents
children
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
0
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
1 undef $VERSION;
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
2 package Bio::Roary::CommandLine::RoaryPostAnalysis;
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
3
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
4 # ABSTRACT: Perform the post analysis on the pan genome
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
5
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
6 =head1 SYNOPSIS
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
7
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
8 Perform the post analysis on the pan genome
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
9
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
10 =cut
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
11
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
12 use Moose;
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
13 use Getopt::Long qw(GetOptionsFromArray);
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
14 use Bio::Roary::PostAnalysis;
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
15 use File::Find::Rule;
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
16 use Bio::Roary::External::GeneAlignmentFromNucleotides;
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
17 use File::Path qw(remove_tree);
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
18 use Bio::Roary::External::Fasttree;
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
19 extends 'Bio::Roary::CommandLine::Common';
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
20
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
21 has 'args' => ( is => 'ro', isa => 'ArrayRef', required => 1 );
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
22 has 'script_name' => ( is => 'ro', isa => 'Str', required => 1 );
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
23 has 'help' => ( is => 'rw', isa => 'Bool', default => 0 );
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
24 has '_error_message' => ( is => 'rw', isa => 'Str' );
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
25
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
26 has 'fasta_files' => ( is => 'rw', isa => 'Str', default => '_fasta_files' );
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
27 has 'input_files' => ( is => 'rw', isa => 'Str', default => '_gff_files');
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
28 has 'output_filename' => ( is => 'rw', isa => 'Str', default => 'clustered_proteins' );
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
29 has 'output_pan_geneome_filename' => ( is => 'rw', isa => 'Str', default => 'pan_genome.fa' );
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
30 has 'output_statistics_filename' => ( is => 'rw', isa => 'Str', default => 'gene_presence_absence.csv' );
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
31 has 'output_multifasta_files' => ( is => 'rw', isa => 'Bool', default => 0 );
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
32 has 'clusters_filename' => ( is => 'rw', isa => 'Str', default => '_clustered.clstr' );
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
33 has 'job_runner' => ( is => 'rw', isa => 'Str', default => 'Local' );
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
34 has 'cpus' => ( is => 'rw', isa => 'Int', default => 1 );
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
35 has 'dont_delete_files' => ( is => 'rw', isa => 'Bool', default => 0 );
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
36 has 'dont_create_rplots' => ( is => 'rw', isa => 'Bool', default => 0 );
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
37 has 'dont_split_groups' => ( is => 'rw', isa => 'Bool', default => 0 );
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
38 has 'verbose_stats' => ( is => 'rw', isa => 'Bool', default => 0 );
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
39 has 'translation_table' => ( is => 'rw', isa => 'Int', default => 11 );
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
40 has 'group_limit' => ( is => 'rw', isa => 'Num', default => 50000 );
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
41 has 'core_definition' => ( is => 'rw', isa => 'Num', default => 0.99 );
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
42 has 'verbose' => ( is => 'rw', isa => 'Bool', default => 0 );
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
43 has 'mafft' => ( is => 'rw', isa => 'Bool', default => 0 );
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
44 has 'allow_paralogs' => ( is => 'rw', isa => 'Bool', default => 0 );
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
45
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
46 sub BUILD {
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
47 my ($self) = @_;
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
48
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
49 my (
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
50 $output_filename, $dont_create_rplots, $dont_delete_files, $dont_split_groups, $output_pan_geneome_filename,
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
51 $job_runner, $output_statistics_filename, $output_multifasta_files, $clusters_filename, $core_definition,
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
52 $fasta_files, $input_files, $verbose_stats, $translation_table, $help, $cpus,$group_limit,$verbose,$mafft, $allow_paralogs
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
53 );
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
54
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
55
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
56 GetOptionsFromArray(
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
57 $self->args,
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
58 'o|output=s' => \$output_filename,
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
59 'j|job_runner=s' => \$job_runner,
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
60 'm|output_multifasta_files' => \$output_multifasta_files,
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
61 'p=s' => \$output_pan_geneome_filename,
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
62 's=s' => \$output_statistics_filename,
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
63 'c=s' => \$clusters_filename,
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
64 'f=s' => \$fasta_files,
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
65 'i=s' => \$input_files,
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
66 'a|dont_delete_files' => \$dont_delete_files,
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
67 'b|dont_create_rplots' => \$dont_create_rplots,
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
68 'd|dont_split_groups' => \$dont_split_groups,
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
69 'e|verbose_stats' => \$verbose_stats,
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
70 'z|processors=i' => \$cpus,
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
71 't|translation_table=i' => \$translation_table,
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
72 'g|group_limit=i' => \$group_limit,
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
73 'cd|core_definition=f' => \$core_definition,
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
74 'v|verbose' => \$verbose,
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
75 'n|mafft' => \$mafft,
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
76 'q|allow_paralogs' => \$allow_paralogs,
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
77 'h|help' => \$help,
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
78 );
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
79
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
80 $self->help($help) if(defined($help));
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
81 $self->job_runner($job_runner) if ( defined($job_runner) );
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
82 $self->fasta_files($fasta_files) if ( defined($fasta_files) );
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
83 $self->input_files($input_files) if ( defined($input_files) );
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
84 $self->output_filename($output_filename) if ( defined($output_filename) );
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
85 $self->output_pan_geneome_filename($output_pan_geneome_filename) if ( defined($output_pan_geneome_filename) );
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
86 $self->output_statistics_filename($output_statistics_filename) if ( defined($output_statistics_filename) );
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
87 $self->output_multifasta_files($output_multifasta_files) if ( defined($output_multifasta_files) );
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
88 $self->clusters_filename($clusters_filename) if ( defined($clusters_filename) );
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
89 $self->dont_delete_files($dont_delete_files) if ( defined($dont_delete_files) );
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
90 $self->dont_create_rplots($dont_create_rplots) if ( defined($dont_create_rplots) );
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
91 $self->dont_split_groups($dont_split_groups) if ( defined($dont_split_groups) );
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
92 $self->verbose_stats($verbose_stats) if ( defined($verbose_stats));
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
93 $self->translation_table($translation_table) if ( defined($translation_table) );
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
94 $self->cpus($cpus) if ( defined($cpus) );
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
95 $self->group_limit($group_limit) if ( defined($group_limit) );
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
96 $self->core_definition( $core_definition/100 ) if ( defined($core_definition) );
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
97 $self->mafft($mafft) if ( defined($mafft) );
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
98 $self->allow_paralogs($allow_paralogs) if ( defined($allow_paralogs) );
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
99 if ( defined($verbose) ) {
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
100 $self->verbose($verbose);
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
101 $self->logger->level(10000);
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
102 }
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
103 }
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
104
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
105 sub run {
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
106 my ($self) = @_;
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
107
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
108 ( !$self->help ) or die $self->usage_text;
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
109 if ( defined( $self->_error_message ) ) {
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
110 print $self->_error_message . "\n";
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
111 die $self->usage_text;
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
112 }
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
113
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
114 my $input_files = $self->_read_file_into_array($self->input_files);
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
115 my $obj = Bio::Roary::PostAnalysis->new(
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
116 fasta_files => $self->_read_file_into_array($self->fasta_files) ,
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
117 input_files => $input_files ,
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
118 output_filename => $self->output_filename ,
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
119 output_pan_geneome_filename => $self->output_pan_geneome_filename,
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
120 output_statistics_filename => $self->output_statistics_filename ,
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
121 output_multifasta_files => $self->output_multifasta_files ,
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
122 clusters_filename => $self->clusters_filename ,
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
123 dont_delete_files => $self->dont_delete_files,
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
124 dont_create_rplots => $self->dont_create_rplots,
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
125 dont_split_groups => $self->dont_split_groups,
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
126 verbose_stats => $self->verbose_stats,
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
127 group_limit => $self->group_limit,
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
128 verbose => $self->verbose,
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
129 cpus => $self->cpus,
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
130 logger => $self->logger,
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
131 core_definition => $self->core_definition,
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
132 );
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
133 $obj->run();
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
134
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
135 if($self->dont_delete_files == 0)
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
136 {
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
137 unlink('_inflated_unsplit_mcl_groups');
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
138 remove_tree('split_groups');
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
139 }
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
140
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
141 if($self->output_multifasta_files == 1)
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
142 {
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
143 print "Aligning each cluster\n" if($self->verbose);
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
144
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
145 my $job_runner_to_use = $self->job_runner;
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
146 if($self->_is_lsf_job_runner_available && $self->job_runner eq "LSF")
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
147 {
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
148 $job_runner_to_use = $self->job_runner;
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
149 }
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
150 else
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
151 {
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
152 $job_runner_to_use = 'Parallel';
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
153 }
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
154
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
155 my $output_gene_files = $self->_find_input_files;
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
156 my $seg = Bio::Roary::External::GeneAlignmentFromNucleotides->new(
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
157 fasta_files => $output_gene_files,
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
158 job_runner => $job_runner_to_use,
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
159 translation_table => $self->translation_table,
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
160 core_definition => $self->core_definition,
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
161 cpus => $self->cpus,
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
162 verbose => $self->verbose,
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
163 mafft => $self->mafft,
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
164 allow_paralogs => $self->allow_paralogs,
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
165 dont_delete_files => $self->dont_delete_files,
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
166 num_input_files => $#{$input_files},
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
167 );
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
168 $seg->run();
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
169 }
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
170 }
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
171
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
172 sub _is_lsf_job_runner_available
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
173 {
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
174 my ($self) = @_;
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
175 my $rc = eval "require Bio::Roary::JobRunner::LSF; 1;";
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
176 if(defined($rc) && $rc == 1)
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
177 {
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
178 return 1;
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
179 }
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
180 else
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
181 {
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
182 return 0;
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
183 }
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
184 }
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
185
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
186 sub _find_input_files
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
187 {
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
188 my ($self) = @_;
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
189 my @files = File::Find::Rule->file()
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
190 ->name( '*.fa' )
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
191 ->in('pan_genome_sequences' );
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
192 return \@files;
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
193 }
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
194
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
195 sub _read_file_into_array
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
196 {
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
197 my ($self, $filename) = @_;
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
198 open(my $in_fh, $filename);
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
199
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
200 my @filenames;
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
201 while(<$in_fh>){
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
202 chomp;
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
203 my $line = $_;
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
204 push(@filenames, $line);
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
205 }
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
206 return \@filenames;
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
207 }
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
208
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
209 sub usage_text {
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
210 my ($self) = @_;
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
211
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
212 return <<USAGE;
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
213 Usage: pan_genome_post_analysis [options]
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
214 Perform the post analysis on the pan genome. This script is usally only called by another script.
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
215
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
216 Options: -a dont delete intermediate files
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
217 -b dont create R plots
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
218 -c STR clusters filename [_clustered.clstr]
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
219 -cd FLOAT percentage of isolates a gene must be in to be core [0.99]
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
220 -d dont split groups
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
221 -e add inference values to gene presence and absence spreadsheet
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
222 -f STR file of protein filenames [_fasta_files]
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
223 -g INT maximum number of clusters [50000]
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
224 -i STR file of GFF filenames [_gff_files]
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
225 -m core gene alignement with PRANK
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
226 -n fast core gene alignement with MAFFT instead of PRANK
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
227 -o STR clusters output filename [clustered_proteins]
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
228 -p STR output pan genome filename [pan_genome.fa]
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
229 -q allow paralogs in core alignment
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
230 -s STR output gene presence and absence filename [gene_presence_absence.csv]
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
231 -t INT translation table [11]
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
232 -z INT number of threads [1]
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
233 -v verbose output to STDOUT
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
234 -h this help message
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
235
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
236 For further info see: http://sanger-pathogens.github.io/Roary/
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
237 USAGE
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
238 }
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
239
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
240 __PACKAGE__->meta->make_immutable;
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
241 no Moose;
c47a5f61bc9f Uploaded
dereeper
parents:
diff changeset
242 1;