annotate kaks_analysis.xml @ 2:2fe7044626ac draft

Uploaded
author greg
date Thu, 24 Aug 2017 13:41:07 -0400
parents 3aca88613abf
children 1fb0f2092177
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
2
2fe7044626ac Uploaded
greg
parents: 1
diff changeset
1 <tool id="plant_tribes_kaks_analysis" name="KaKsAnalysis" version="@WRAPPER_VERSION@.2">
0
2f0b8e19286b Uploaded
greg
parents:
diff changeset
2 <description>estimates paralogous and orthologous pairwise synonymous (Ks) and non-synonymous (Ka) substitution rates</description>
2f0b8e19286b Uploaded
greg
parents:
diff changeset
3 <macros>
2f0b8e19286b Uploaded
greg
parents:
diff changeset
4 <import>macros.xml</import>
2f0b8e19286b Uploaded
greg
parents:
diff changeset
5 </macros>
2f0b8e19286b Uploaded
greg
parents:
diff changeset
6 <expand macro="requirements_kaks_analysis" />
2f0b8e19286b Uploaded
greg
parents:
diff changeset
7 <command detect_errors="exit_code"><![CDATA[
2f0b8e19286b Uploaded
greg
parents:
diff changeset
8 #set output_dir = 'kaksAnalysis_dir'
2f0b8e19286b Uploaded
greg
parents:
diff changeset
9 #set comparison = $comparison_cond.comparison
2f0b8e19286b Uploaded
greg
parents:
diff changeset
10 #if str($options_type.options_type_selector) == 'advanced':
2f0b8e19286b Uploaded
greg
parents:
diff changeset
11 #set codeml_ctl_file_cond = $options_type.codeml_ctl_file_cond
2f0b8e19286b Uploaded
greg
parents:
diff changeset
12 #set codeml_ctl_file_select = $codeml_ctl_file_cond.codeml_ctl_file_select
2f0b8e19286b Uploaded
greg
parents:
diff changeset
13 #set fit_components_cond = $options_type.fit_components_cond
2f0b8e19286b Uploaded
greg
parents:
diff changeset
14 #set fit_components = $fit_components_cond.fit_components
2f0b8e19286b Uploaded
greg
parents:
diff changeset
15 #set recalibrate_cond = $options_type.recalibrate_cond
2f0b8e19286b Uploaded
greg
parents:
diff changeset
16 #set recalibrate = $recalibrate_cond.recalibrate
2f0b8e19286b Uploaded
greg
parents:
diff changeset
17 #set set_min_coverage_cond = $options_type.set_min_coverage_cond
2f0b8e19286b Uploaded
greg
parents:
diff changeset
18 #set set_min_coverage = $set_min_coverage_cond.set_min_coverage
2f0b8e19286b Uploaded
greg
parents:
diff changeset
19 #set set_lower_ks_limit_cond = $options_type.set_lower_ks_limit_cond
2f0b8e19286b Uploaded
greg
parents:
diff changeset
20 #set set_lower_ks_limit = $set_lower_ks_limit_cond.set_lower_ks_limit
2f0b8e19286b Uploaded
greg
parents:
diff changeset
21 #set set_upper_ks_limit_cond = $options_type.set_upper_ks_limit_cond
2f0b8e19286b Uploaded
greg
parents:
diff changeset
22 #set set_upper_ks_limit = $set_upper_ks_limit_cond.set_upper_ks_limit
2f0b8e19286b Uploaded
greg
parents:
diff changeset
23 #else:
2f0b8e19286b Uploaded
greg
parents:
diff changeset
24 #set codeml_ctl_file_select = 'no'
2f0b8e19286b Uploaded
greg
parents:
diff changeset
25 #set fit_components = 'no'
2f0b8e19286b Uploaded
greg
parents:
diff changeset
26 #set set_lower_ks_limit = 'no'
2f0b8e19286b Uploaded
greg
parents:
diff changeset
27 #set set_upper_ks_limit = 'no'
2f0b8e19286b Uploaded
greg
parents:
diff changeset
28 #end if
2f0b8e19286b Uploaded
greg
parents:
diff changeset
29 KaKsAnalysis
2f0b8e19286b Uploaded
greg
parents:
diff changeset
30 --num_threads \${GALAXY_SLOTS:-4}
2f0b8e19286b Uploaded
greg
parents:
diff changeset
31 --coding_sequences_species_1 '$coding_sequences_species_1'
2f0b8e19286b Uploaded
greg
parents:
diff changeset
32 --proteins_species_1 '$proteins_species_1'
2f0b8e19286b Uploaded
greg
parents:
diff changeset
33 --comparison $comparison
2f0b8e19286b Uploaded
greg
parents:
diff changeset
34 #if str($comparison) == 'orthologs':
2f0b8e19286b Uploaded
greg
parents:
diff changeset
35 --coding_sequences_species_2 '$comparison_cond.coding_sequences_species_2'
2f0b8e19286b Uploaded
greg
parents:
diff changeset
36 --proteins_species_2 '$comparison_cond.proteins_species_2'
2f0b8e19286b Uploaded
greg
parents:
diff changeset
37 #end if
2f0b8e19286b Uploaded
greg
parents:
diff changeset
38 #if str($options_type.options_type_selector) == 'advanced':
2f0b8e19286b Uploaded
greg
parents:
diff changeset
39 #if str($set_min_coverage) == 'yes':
2f0b8e19286b Uploaded
greg
parents:
diff changeset
40 --min_coverage $set_min_coverage_cond.min_coverage
2f0b8e19286b Uploaded
greg
parents:
diff changeset
41 #end if
2f0b8e19286b Uploaded
greg
parents:
diff changeset
42 #if str($recalibrate) == 'yes':
2f0b8e19286b Uploaded
greg
parents:
diff changeset
43 --recalibration_rate $recalibrate_cond.recalibration_rate
2f0b8e19286b Uploaded
greg
parents:
diff changeset
44 #end if
2f0b8e19286b Uploaded
greg
parents:
diff changeset
45 #if str($codeml_ctl_file_select) == 'yes':
2f0b8e19286b Uploaded
greg
parents:
diff changeset
46 --codeml_ctl_file '$codeml_ctl_file_cond.codeml_ctl_file'
2f0b8e19286b Uploaded
greg
parents:
diff changeset
47 ## No else block needed here because the default codeml_ctl config
2f0b8e19286b Uploaded
greg
parents:
diff changeset
48 ## will be used if the --codeml_ctl_file flag is missing.
2f0b8e19286b Uploaded
greg
parents:
diff changeset
49 #end if
2f0b8e19286b Uploaded
greg
parents:
diff changeset
50 #if str($fit_components) == 'yes':
2f0b8e19286b Uploaded
greg
parents:
diff changeset
51 --fit_components
2f0b8e19286b Uploaded
greg
parents:
diff changeset
52 --num_of_components $fit_components_cond.num_of_components
2f0b8e19286b Uploaded
greg
parents:
diff changeset
53 #end if
2f0b8e19286b Uploaded
greg
parents:
diff changeset
54 #if str($set_lower_ks_limit) == 'yes':
2f0b8e19286b Uploaded
greg
parents:
diff changeset
55 --min_ks $set_lower_ks_limit_cond.min_ks
2f0b8e19286b Uploaded
greg
parents:
diff changeset
56 #end if
2f0b8e19286b Uploaded
greg
parents:
diff changeset
57 #if str($set_upper_ks_limit) == 'yes':
2f0b8e19286b Uploaded
greg
parents:
diff changeset
58 --max_ks $set_upper_ks_limit_cond.max_ks
2f0b8e19286b Uploaded
greg
parents:
diff changeset
59 #end if
2f0b8e19286b Uploaded
greg
parents:
diff changeset
60 #end if
2f0b8e19286b Uploaded
greg
parents:
diff changeset
61 >/dev/null
2f0b8e19286b Uploaded
greg
parents:
diff changeset
62 && mv $output_dir/species1.fna '$output_species1_fna'
2f0b8e19286b Uploaded
greg
parents:
diff changeset
63 && mv $output_dir/species1.faa '$output_species1_faa'
2f0b8e19286b Uploaded
greg
parents:
diff changeset
64 #if str($comparison) == 'paralogs':
2f0b8e19286b Uploaded
greg
parents:
diff changeset
65 && mv $output_dir/species1.fna.blastn.paralogs '$output_species1_paralog'
2f0b8e19286b Uploaded
greg
parents:
diff changeset
66 #else:
2f0b8e19286b Uploaded
greg
parents:
diff changeset
67 && mv $output_dir/species2.faa '$output_species2_faa'
2f0b8e19286b Uploaded
greg
parents:
diff changeset
68 && mv $output_dir/species2.fna '$output_species2_fna'
2f0b8e19286b Uploaded
greg
parents:
diff changeset
69 && mv $output_dir/species1.fna.blastn.orthologs '$output_species1_ortholog'
2f0b8e19286b Uploaded
greg
parents:
diff changeset
70 && mv $output_dir/species2.fna.blastn.orthologs '$output_species2_ortholog'
2f0b8e19286b Uploaded
greg
parents:
diff changeset
71 #end if
2f0b8e19286b Uploaded
greg
parents:
diff changeset
72 && mv $output_dir/*.rbhb '$output_rbhb'
2f0b8e19286b Uploaded
greg
parents:
diff changeset
73 && mv $output_dir/*.kaks '$output_kaks'
2f0b8e19286b Uploaded
greg
parents:
diff changeset
74 #if str($fit_components) == 'yes':
2f0b8e19286b Uploaded
greg
parents:
diff changeset
75 && mv $output_dir/*.components '$output_components'
2f0b8e19286b Uploaded
greg
parents:
diff changeset
76 #end if
2f0b8e19286b Uploaded
greg
parents:
diff changeset
77 ]]></command>
2f0b8e19286b Uploaded
greg
parents:
diff changeset
78 <inputs>
2f0b8e19286b Uploaded
greg
parents:
diff changeset
79 <param name="coding_sequences_species_1" format="fasta" type="data" label="Coding sequences for the first species" />
2f0b8e19286b Uploaded
greg
parents:
diff changeset
80 <param name="proteins_species_1" format="fasta" type="data" label="Protein sequences for the first species" />
2f0b8e19286b Uploaded
greg
parents:
diff changeset
81 <conditional name="comparison_cond">
2f0b8e19286b Uploaded
greg
parents:
diff changeset
82 <param name="comparison" type="select" label="Type of sequence comparison">
2f0b8e19286b Uploaded
greg
parents:
diff changeset
83 <option value="paralogs" selected="true">Paralogous</option>
2f0b8e19286b Uploaded
greg
parents:
diff changeset
84 <option value="orthologs">Orthologous</option>
2f0b8e19286b Uploaded
greg
parents:
diff changeset
85 </param>
2f0b8e19286b Uploaded
greg
parents:
diff changeset
86 <when value="paralogs" />
2f0b8e19286b Uploaded
greg
parents:
diff changeset
87 <when value="orthologs">
2f0b8e19286b Uploaded
greg
parents:
diff changeset
88 <param name="coding_sequences_species_2" format="fasta" type="data" label="Coding sequences for the second species" />
2f0b8e19286b Uploaded
greg
parents:
diff changeset
89 <param name="proteins_species_2" format="fasta" type="data" label="Protein sequences for the second species" />
2f0b8e19286b Uploaded
greg
parents:
diff changeset
90 </when>
2f0b8e19286b Uploaded
greg
parents:
diff changeset
91 </conditional>
2f0b8e19286b Uploaded
greg
parents:
diff changeset
92 <conditional name="options_type">
2f0b8e19286b Uploaded
greg
parents:
diff changeset
93 <param name="options_type_selector" type="select" label="Options Configuration">
2f0b8e19286b Uploaded
greg
parents:
diff changeset
94 <option value="basic" selected="true">Basic</option>
2f0b8e19286b Uploaded
greg
parents:
diff changeset
95 <option value="advanced">Advanced</option>
2f0b8e19286b Uploaded
greg
parents:
diff changeset
96 </param>
2f0b8e19286b Uploaded
greg
parents:
diff changeset
97 <when value="basic" />
2f0b8e19286b Uploaded
greg
parents:
diff changeset
98 <when value="advanced">
2f0b8e19286b Uploaded
greg
parents:
diff changeset
99 <conditional name="set_min_coverage_cond">
2f0b8e19286b Uploaded
greg
parents:
diff changeset
100 <param name="set_min_coverage" type="select" label="Alignment coverage configuration">
2f0b8e19286b Uploaded
greg
parents:
diff changeset
101 <option value="no" selected="true">No</option>
2f0b8e19286b Uploaded
greg
parents:
diff changeset
102 <option value="yes">Yes</option>
2f0b8e19286b Uploaded
greg
parents:
diff changeset
103 </param>
2f0b8e19286b Uploaded
greg
parents:
diff changeset
104 <when value="no" />
2f0b8e19286b Uploaded
greg
parents:
diff changeset
105 <when value="yes">
2f0b8e19286b Uploaded
greg
parents:
diff changeset
106 <param name="min_coverage" type="float" value="0.5" min="0.3" max="1.0" label="match score" />
2f0b8e19286b Uploaded
greg
parents:
diff changeset
107 </when>
2f0b8e19286b Uploaded
greg
parents:
diff changeset
108 </conditional>
2f0b8e19286b Uploaded
greg
parents:
diff changeset
109 <conditional name="recalibrate_cond">
2f0b8e19286b Uploaded
greg
parents:
diff changeset
110 <param name="recalibrate" type="select" label="Species rates recalibration configuration">
2f0b8e19286b Uploaded
greg
parents:
diff changeset
111 <option value="no" selected="true">No</option>
2f0b8e19286b Uploaded
greg
parents:
diff changeset
112 <option value="yes">Yes</option>
2f0b8e19286b Uploaded
greg
parents:
diff changeset
113 </param>
2f0b8e19286b Uploaded
greg
parents:
diff changeset
114 <when value="no" />
2f0b8e19286b Uploaded
greg
parents:
diff changeset
115 <when value="yes">
2f0b8e19286b Uploaded
greg
parents:
diff changeset
116 <param name="recalibration_rate" type="float" value="0.0" min="0.0" label="Recalibration rate" />
2f0b8e19286b Uploaded
greg
parents:
diff changeset
117 </when>
2f0b8e19286b Uploaded
greg
parents:
diff changeset
118 </conditional>
2f0b8e19286b Uploaded
greg
parents:
diff changeset
119 <conditional name="codeml_ctl_file_cond">
2f0b8e19286b Uploaded
greg
parents:
diff changeset
120 <param name="codeml_ctl_file_select" type="select" label="PAML codeml configuration">
2f0b8e19286b Uploaded
greg
parents:
diff changeset
121 <option value="no" selected="true">No</option>
2f0b8e19286b Uploaded
greg
parents:
diff changeset
122 <option value="yes">Yes</option>
2f0b8e19286b Uploaded
greg
parents:
diff changeset
123 </param>
2f0b8e19286b Uploaded
greg
parents:
diff changeset
124 <when value="no" />
2f0b8e19286b Uploaded
greg
parents:
diff changeset
125 <when value="yes">
2f0b8e19286b Uploaded
greg
parents:
diff changeset
126 <param name="codeml_ctl_file" format="txt" type="data" label="PAML codeml control file" />
2f0b8e19286b Uploaded
greg
parents:
diff changeset
127 </when>
2f0b8e19286b Uploaded
greg
parents:
diff changeset
128 </conditional>
2f0b8e19286b Uploaded
greg
parents:
diff changeset
129 <conditional name="fit_components_cond">
2f0b8e19286b Uploaded
greg
parents:
diff changeset
130 <param name="fit_components" type="select" label="Rates clustering configuration">
2f0b8e19286b Uploaded
greg
parents:
diff changeset
131 <option value="no" selected="true">No</option>
2f0b8e19286b Uploaded
greg
parents:
diff changeset
132 <option value="yes">Yes</option>
2f0b8e19286b Uploaded
greg
parents:
diff changeset
133 </param>
2f0b8e19286b Uploaded
greg
parents:
diff changeset
134 <when value="no" />
2f0b8e19286b Uploaded
greg
parents:
diff changeset
135 <when value="yes">
2f0b8e19286b Uploaded
greg
parents:
diff changeset
136 <param name="num_of_components" type="integer" value="1" min="1" label="Number of components" />
2f0b8e19286b Uploaded
greg
parents:
diff changeset
137 </when>
2f0b8e19286b Uploaded
greg
parents:
diff changeset
138 </conditional>
2f0b8e19286b Uploaded
greg
parents:
diff changeset
139 <conditional name="set_lower_ks_limit_cond">
2f0b8e19286b Uploaded
greg
parents:
diff changeset
140 <param name="set_lower_ks_limit" type="select" label="Lower limit synonymous substitution rates configuration">
2f0b8e19286b Uploaded
greg
parents:
diff changeset
141 <option value="no" selected="true">No</option>
2f0b8e19286b Uploaded
greg
parents:
diff changeset
142 <option value="yes">Yes</option>
2f0b8e19286b Uploaded
greg
parents:
diff changeset
143 </param>
2f0b8e19286b Uploaded
greg
parents:
diff changeset
144 <when value="no" />
2f0b8e19286b Uploaded
greg
parents:
diff changeset
145 <when value="yes">
2f0b8e19286b Uploaded
greg
parents:
diff changeset
146 <param name="min_ks" type="float" value="0.0" min="0.0" label="Minimum rate" />
2f0b8e19286b Uploaded
greg
parents:
diff changeset
147 </when>
2f0b8e19286b Uploaded
greg
parents:
diff changeset
148 </conditional>
2f0b8e19286b Uploaded
greg
parents:
diff changeset
149 <conditional name="set_upper_ks_limit_cond">
2f0b8e19286b Uploaded
greg
parents:
diff changeset
150 <param name="set_upper_ks_limit" type="select" label="Upper limit synonymous substitution rates configuration">
2f0b8e19286b Uploaded
greg
parents:
diff changeset
151 <option value="no" selected="true">No</option>
2f0b8e19286b Uploaded
greg
parents:
diff changeset
152 <option value="yes">Yes</option>
2f0b8e19286b Uploaded
greg
parents:
diff changeset
153 </param>
2f0b8e19286b Uploaded
greg
parents:
diff changeset
154 <when value="no" />
2f0b8e19286b Uploaded
greg
parents:
diff changeset
155 <when value="yes">
2f0b8e19286b Uploaded
greg
parents:
diff changeset
156 <param name="max_ks" type="float" value="0.0" min="0.0" label="Maximum rate" />
2f0b8e19286b Uploaded
greg
parents:
diff changeset
157 </when>
2f0b8e19286b Uploaded
greg
parents:
diff changeset
158 </conditional>
2f0b8e19286b Uploaded
greg
parents:
diff changeset
159 </when>
2f0b8e19286b Uploaded
greg
parents:
diff changeset
160 </conditional>
2f0b8e19286b Uploaded
greg
parents:
diff changeset
161 <!-- Required due to the Emmix license -->
2f0b8e19286b Uploaded
greg
parents:
diff changeset
162 <param name="non_commercial_use" label="I certify that I am not using this tool for commercial purposes." type="boolean" truevalue="NON_COMMERCIAL_USE" falsevalue="COMMERCIAL_USE" checked="False">
2f0b8e19286b Uploaded
greg
parents:
diff changeset
163 <validator type="expression" message="This tool is only available for non-commercial use.">value == True</validator>
2f0b8e19286b Uploaded
greg
parents:
diff changeset
164 </param>
2f0b8e19286b Uploaded
greg
parents:
diff changeset
165 </inputs>
2f0b8e19286b Uploaded
greg
parents:
diff changeset
166 <outputs>
2f0b8e19286b Uploaded
greg
parents:
diff changeset
167 <data name="output_species1_fna" format="fasta" label="${tool.name} (coding sequences) on ${on_string}" />
2f0b8e19286b Uploaded
greg
parents:
diff changeset
168 <data name="output_species1_faa" format="fasta" label="${tool.name} (amino acids) on ${on_string}" />
2f0b8e19286b Uploaded
greg
parents:
diff changeset
169 <data name="output_species2_fna" format="fasta" label="${tool.name} (coding sequences) on ${on_string}">
2f0b8e19286b Uploaded
greg
parents:
diff changeset
170 <filter>comparison_cond['comparison'] == 'orthologs'</filter>
2f0b8e19286b Uploaded
greg
parents:
diff changeset
171 </data>
2f0b8e19286b Uploaded
greg
parents:
diff changeset
172 <data name="output_species2_faa" format="fasta" label="${tool.name} (amino acids) on ${on_string}">
2f0b8e19286b Uploaded
greg
parents:
diff changeset
173 <filter>comparison_cond['comparison'] == 'orthologs'</filter>
2f0b8e19286b Uploaded
greg
parents:
diff changeset
174 </data>
2f0b8e19286b Uploaded
greg
parents:
diff changeset
175 <data name="output_species1_paralog" format="tabular" label="${tool.name} (blastn results) on ${on_string}">
2f0b8e19286b Uploaded
greg
parents:
diff changeset
176 <filter>comparison_cond['comparison'] == 'paralogs'</filter>
2f0b8e19286b Uploaded
greg
parents:
diff changeset
177 </data>
2f0b8e19286b Uploaded
greg
parents:
diff changeset
178 <data name="output_species1_ortholog" format="tabular" label="${tool.name} (blastn results) on ${on_string}">
2f0b8e19286b Uploaded
greg
parents:
diff changeset
179 <filter>comparison_cond['comparison'] == 'orthologs'</filter>
2f0b8e19286b Uploaded
greg
parents:
diff changeset
180 </data>
2f0b8e19286b Uploaded
greg
parents:
diff changeset
181 <data name="output_species2_ortholog" format="tabular" label="${tool.name} (blastn results) on ${on_string}">
2f0b8e19286b Uploaded
greg
parents:
diff changeset
182 <filter>comparison_cond['comparison'] == 'orthologs'</filter>
2f0b8e19286b Uploaded
greg
parents:
diff changeset
183 </data>
2f0b8e19286b Uploaded
greg
parents:
diff changeset
184 <data name="output_rbhb" format="tabular" label="${tool.name} (paralogous pairs) on ${on_string}" />
2f0b8e19286b Uploaded
greg
parents:
diff changeset
185 <data name="output_kaks" format="tabular" label="${tool.name} on ${on_string}" />
1
3aca88613abf Uploaded
greg
parents: 0
diff changeset
186 <data name="output_components" format="ptkscmp" label="${tool.name} (significant components in the ks distribution) on ${on_string}">
0
2f0b8e19286b Uploaded
greg
parents:
diff changeset
187 <filter>options_type['options_type_selector'] == 'advanced' and options_type['fit_components_cond']['fit_components'] == 'yes'</filter>
2f0b8e19286b Uploaded
greg
parents:
diff changeset
188 </data>
2f0b8e19286b Uploaded
greg
parents:
diff changeset
189 </outputs>
2f0b8e19286b Uploaded
greg
parents:
diff changeset
190 <tests>
2f0b8e19286b Uploaded
greg
parents:
diff changeset
191 <test>
2f0b8e19286b Uploaded
greg
parents:
diff changeset
192 <param name="coding_sequences_species_1" value="species1_cds.fasta" ftype="fasta"/>
2f0b8e19286b Uploaded
greg
parents:
diff changeset
193 <param name="proteins_species_1" value="species1_pep.fasta" ftype="fasta"/>
1
3aca88613abf Uploaded
greg
parents: 0
diff changeset
194 <param name="non_commercial_use" value="True"/>
0
2f0b8e19286b Uploaded
greg
parents:
diff changeset
195 <output name="output_species1_fna" file="species1_cds.fasta" ftype="fasta" compare="contains"/>
2f0b8e19286b Uploaded
greg
parents:
diff changeset
196 <output name="output_species1_faa" file="species1_pep.fasta" ftype="fasta" compare="contains"/>
2f0b8e19286b Uploaded
greg
parents:
diff changeset
197 <output name="output_species1_paralog" file="output_blastn_results1.tabular" ftype="tabular" compare="contains"/>
2f0b8e19286b Uploaded
greg
parents:
diff changeset
198 <output name="output_rbhb" file="output_paralogous_pairs.tabular" ftype="tabular"/>
2f0b8e19286b Uploaded
greg
parents:
diff changeset
199 <output name="output_kaks" file="output1.tabular" ftype="tabular"/>
2f0b8e19286b Uploaded
greg
parents:
diff changeset
200 </test>
2f0b8e19286b Uploaded
greg
parents:
diff changeset
201 </tests>
2f0b8e19286b Uploaded
greg
parents:
diff changeset
202 <help>
2f0b8e19286b Uploaded
greg
parents:
diff changeset
203 This tool is one of the PlantTribes collection of automated modular analysis pipelines for comparative and evolutionary analyses
2f0b8e19286b Uploaded
greg
parents:
diff changeset
204 of genome-scale gene families and transcriptomes. This tool estimates paralogous and orthologous pairwise synonymous (Ks) and
2f0b8e19286b Uploaded
greg
parents:
diff changeset
205 non-synonymous (Ka) substitution rates for a set of gene coding sequences either produced by the AssemblyPostProcessor tool or
2f0b8e19286b Uploaded
greg
parents:
diff changeset
206 from an external source. Optionally, the resulting set of estimated Ks values can be clustered into components using a mixture
2f0b8e19286b Uploaded
greg
parents:
diff changeset
207 of multivariate normal distributions to identify significant duplication event(s) in a species or a pair of species.
2f0b8e19286b Uploaded
greg
parents:
diff changeset
208
2f0b8e19286b Uploaded
greg
parents:
diff changeset
209 -----
2f0b8e19286b Uploaded
greg
parents:
diff changeset
210
2f0b8e19286b Uploaded
greg
parents:
diff changeset
211 * **Required options**
2f0b8e19286b Uploaded
greg
parents:
diff changeset
212
2f0b8e19286b Uploaded
greg
parents:
diff changeset
213 - **Coding sequences for the first species** - coding sequence fasta file for the first species either produced by the AssemblyPostProcessor tool or from an external source selected from your history.
2f0b8e19286b Uploaded
greg
parents:
diff changeset
214 - **Protein sequences for the first species** - corresponding protein sequence fasta files for the first species either produced by the AssemblyPostProcessor tool or from an external source selected from your history.
2f0b8e19286b Uploaded
greg
parents:
diff changeset
215 - **Type of sequence comparison** - pairwise sequence comparison to determine homologous pairs. This can be either paralogous for self-species comparison or orthologous for cross-species comparison. Cross-species comparison requires input for the second species.
2f0b8e19286b Uploaded
greg
parents:
diff changeset
216
2f0b8e19286b Uploaded
greg
parents:
diff changeset
217 * **Other options**
2f0b8e19286b Uploaded
greg
parents:
diff changeset
218
2f0b8e19286b Uploaded
greg
parents:
diff changeset
219 - **Coding sequences for the second species** - coding sequence fasta file for the second species either produced by the AssemblyPostProcessor tool or from an external source selected from your history. This option is required only for orthologous comparison.
2f0b8e19286b Uploaded
greg
parents:
diff changeset
220 - **Protein sequences for the second species** - corresponding protein sequence fasta files for the second species either produced by the AssemblyPostProcessor tool or from an external source selected from your history. This option is required only for orthologous comparison.
2f0b8e19286b Uploaded
greg
parents:
diff changeset
221 - **Alignment coverage configuration** - select 'Yes' to set the minimum allowable alignment coverage length between homologous pairs. PlantTribes uses global codon alignment match score to determine the pairwise alignment coverage. By default, the match score is set to 0.5 if 'No' is selected.
2f0b8e19286b Uploaded
greg
parents:
diff changeset
222
2f0b8e19286b Uploaded
greg
parents:
diff changeset
223 - **match score** - number of base matches in a pairwise sequence alignment divided by the length of the shorter sequence. Positions in the alignment corresponding to gaps are not considered. The score is restricted to the range 0.3 - 1.0.
2f0b8e19286b Uploaded
greg
parents:
diff changeset
224
2f0b8e19286b Uploaded
greg
parents:
diff changeset
225 - **Species rates recalibration configuration** - select 'Yes' to recalibrate synonymous substitution rates of a species using a predetermined evolutionary rate. Recalibration evolutionary rate can be determined from a species tree inferred from a collection of conserved single copy genes from taxa of interest as described in [7]. Rate recalibration applies only to paralogous comparisons.
2f0b8e19286b Uploaded
greg
parents:
diff changeset
226
2f0b8e19286b Uploaded
greg
parents:
diff changeset
227 - **Recalibration rate** - a predetermined evolutionary recalibration rate.
2f0b8e19286b Uploaded
greg
parents:
diff changeset
228
2f0b8e19286b Uploaded
greg
parents:
diff changeset
229 - **PAML codeml configuration** - select 'Yes' to enable selection of a PAML codeml control file to carry out maximum likelihood analysis of protein-coding DNA sequences using codon substitution models. The template file "codeml.ctl.args" can be found in the scaffold data installed into Galaxy via the PlantTribes Scaffolds Download Data Manager tool, and is also available at the PlantTribes GitHub `repository`_. Default settings shown in the template are used if 'No' is selected.
2f0b8e19286b Uploaded
greg
parents:
diff changeset
230 - **Rates clustering configuration** - select 'Yes' to estimate clusters of synonymous substitution rates using a mixture of multivariate normal distributions which represent putative duplication event(s).
2f0b8e19286b Uploaded
greg
parents:
diff changeset
231
2f0b8e19286b Uploaded
greg
parents:
diff changeset
232 - **Number of components** - number of components to include in the normal mixture model.
2f0b8e19286b Uploaded
greg
parents:
diff changeset
233
2f0b8e19286b Uploaded
greg
parents:
diff changeset
234 - **Lower limit synonymous substitution rates configuration** - select 'Yes' to set the minimum allowable synonymous substitution rate to use in the normal mixtures cluster analysis to exclude young paralogs that arise from normal gene births and deaths in a genome.
2f0b8e19286b Uploaded
greg
parents:
diff changeset
235
2f0b8e19286b Uploaded
greg
parents:
diff changeset
236 - **Minimum rate** - minimum allowable synonymous substitution rate.
2f0b8e19286b Uploaded
greg
parents:
diff changeset
237
2f0b8e19286b Uploaded
greg
parents:
diff changeset
238 - **Upper limit synonymous substitution rates configuration** - select 'Yes' to set the maximum allowable synonymous substitution rate to use in the normal mixtures cluster analysis to exclude likely ancient paralogs in a genome.
2f0b8e19286b Uploaded
greg
parents:
diff changeset
239
2f0b8e19286b Uploaded
greg
parents:
diff changeset
240 - **Maximum rate** - maximum allowable synonymous substitution rate.
2f0b8e19286b Uploaded
greg
parents:
diff changeset
241
2f0b8e19286b Uploaded
greg
parents:
diff changeset
242 .. _repository: https://github.com/dePamphilis/PlantTribes/blob/master/config/codeml.ctl.args
2f0b8e19286b Uploaded
greg
parents:
diff changeset
243
2f0b8e19286b Uploaded
greg
parents:
diff changeset
244 </help>
2f0b8e19286b Uploaded
greg
parents:
diff changeset
245 <citations>
2f0b8e19286b Uploaded
greg
parents:
diff changeset
246 <expand macro="citation1" />
2f0b8e19286b Uploaded
greg
parents:
diff changeset
247 <citation type="bibtex">
2f0b8e19286b Uploaded
greg
parents:
diff changeset
248 @article{Wall2008,
2f0b8e19286b Uploaded
greg
parents:
diff changeset
249 journal = {Nucleic Acids Research},
2f0b8e19286b Uploaded
greg
parents:
diff changeset
250 author = {2. Wall PK, Leebens-Mack J, Muller KF, Field D, Altman NS},
2f0b8e19286b Uploaded
greg
parents:
diff changeset
251 title = {PlantTribes: a gene and gene family resource for comparative genomics in plants},
2f0b8e19286b Uploaded
greg
parents:
diff changeset
252 year = {2008},
2f0b8e19286b Uploaded
greg
parents:
diff changeset
253 volume = {36},
2f0b8e19286b Uploaded
greg
parents:
diff changeset
254 number = {suppl 1},
2f0b8e19286b Uploaded
greg
parents:
diff changeset
255 pages = {D970-D976},}
2f0b8e19286b Uploaded
greg
parents:
diff changeset
256 </citation>
2f0b8e19286b Uploaded
greg
parents:
diff changeset
257 <citation type="bibtex">
2f0b8e19286b Uploaded
greg
parents:
diff changeset
258 @article{Altschul1990,
2f0b8e19286b Uploaded
greg
parents:
diff changeset
259 journal = {Journal of molecular biology},
2f0b8e19286b Uploaded
greg
parents:
diff changeset
260 author = {3. Altschul SF, Gish W, Miller W, Myers EW, Lipman DJ},
2f0b8e19286b Uploaded
greg
parents:
diff changeset
261 title = {Basic local alignment search tool},
2f0b8e19286b Uploaded
greg
parents:
diff changeset
262 year = {1990},
2f0b8e19286b Uploaded
greg
parents:
diff changeset
263 volume = {215},
2f0b8e19286b Uploaded
greg
parents:
diff changeset
264 number = {3},
2f0b8e19286b Uploaded
greg
parents:
diff changeset
265 pages = {403-410},}
2f0b8e19286b Uploaded
greg
parents:
diff changeset
266 </citation>
2f0b8e19286b Uploaded
greg
parents:
diff changeset
267 <citation type="bibtex">
2f0b8e19286b Uploaded
greg
parents:
diff changeset
268 @article{Katoh2013,
2f0b8e19286b Uploaded
greg
parents:
diff changeset
269 journal = {Molecular biology and evolution},
2f0b8e19286b Uploaded
greg
parents:
diff changeset
270 author = {4. Katoh K, Standley DM},
2f0b8e19286b Uploaded
greg
parents:
diff changeset
271 title = {MAFFT multiple sequence alignment software version 7: improvements in performance and usability},
2f0b8e19286b Uploaded
greg
parents:
diff changeset
272 year = {2013},
2f0b8e19286b Uploaded
greg
parents:
diff changeset
273 volume = {30},
2f0b8e19286b Uploaded
greg
parents:
diff changeset
274 number = {4},
2f0b8e19286b Uploaded
greg
parents:
diff changeset
275 pages = {772-780},}
2f0b8e19286b Uploaded
greg
parents:
diff changeset
276 </citation>
2f0b8e19286b Uploaded
greg
parents:
diff changeset
277 <citation type="bibtex">
2f0b8e19286b Uploaded
greg
parents:
diff changeset
278 @article{Yang2007,
2f0b8e19286b Uploaded
greg
parents:
diff changeset
279 journal = {Molecular biology and evolution},
2f0b8e19286b Uploaded
greg
parents:
diff changeset
280 author = {5. Yang Z},
2f0b8e19286b Uploaded
greg
parents:
diff changeset
281 title = {PAML 4: phylogenetic analysis by maximum likelihood},
2f0b8e19286b Uploaded
greg
parents:
diff changeset
282 year = {2007},
2f0b8e19286b Uploaded
greg
parents:
diff changeset
283 volume = {24},
2f0b8e19286b Uploaded
greg
parents:
diff changeset
284 number = {8},
2f0b8e19286b Uploaded
greg
parents:
diff changeset
285 pages = {1586-1591},}
2f0b8e19286b Uploaded
greg
parents:
diff changeset
286 </citation>
2f0b8e19286b Uploaded
greg
parents:
diff changeset
287 <citation type="bibtex">
2f0b8e19286b Uploaded
greg
parents:
diff changeset
288 @article{McLachlan1999,
2f0b8e19286b Uploaded
greg
parents:
diff changeset
289 journal = {Journal of Statistical Software},
2f0b8e19286b Uploaded
greg
parents:
diff changeset
290 author = {6. McLachlan GJ, Peel D, Basford KE, Adams P},
2f0b8e19286b Uploaded
greg
parents:
diff changeset
291 title = {The EMMIX software for the fitting of mixtures of normal and t-components},
2f0b8e19286b Uploaded
greg
parents:
diff changeset
292 year = {1999},
2f0b8e19286b Uploaded
greg
parents:
diff changeset
293 volume = {4},
2f0b8e19286b Uploaded
greg
parents:
diff changeset
294 number = {2},
2f0b8e19286b Uploaded
greg
parents:
diff changeset
295 pages = {1-14},}
2f0b8e19286b Uploaded
greg
parents:
diff changeset
296 </citation>
2f0b8e19286b Uploaded
greg
parents:
diff changeset
297 <citation type="bibtex">
2f0b8e19286b Uploaded
greg
parents:
diff changeset
298 @article{Cui2006,
2f0b8e19286b Uploaded
greg
parents:
diff changeset
299 journal = {Genome Research},
2f0b8e19286b Uploaded
greg
parents:
diff changeset
300 author = {7. Cui L, Wall PK, Leebens-Mack JH, Lindsay BG, Soltis DE, Doyle JJ, Soltis PS, Carlson JE, Arumuganathan K, Barakat A, Albert VA},
2f0b8e19286b Uploaded
greg
parents:
diff changeset
301 title = {Widespread genome duplications throughout the history of flowering plants},
2f0b8e19286b Uploaded
greg
parents:
diff changeset
302 year = {2006},
2f0b8e19286b Uploaded
greg
parents:
diff changeset
303 volume = {16},
2f0b8e19286b Uploaded
greg
parents:
diff changeset
304 number = {6},
2f0b8e19286b Uploaded
greg
parents:
diff changeset
305 pages = {738-749},}
2f0b8e19286b Uploaded
greg
parents:
diff changeset
306 </citation>
2f0b8e19286b Uploaded
greg
parents:
diff changeset
307 </citations>
2f0b8e19286b Uploaded
greg
parents:
diff changeset
308 </tool>