comparison cmbuild.xml @ 9:1d74ed49cf41 draft default tip

planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/infernal commit 09c1d4ab75f5cd057ed57bf694217f0e355f785e
author bgruening
date Mon, 11 Nov 2024 10:27:19 +0000
parents c9e29ac5d099
children
comparison
equal deleted inserted replaced
8:c9e29ac5d099 9:1d74ed49cf41
2 <description>Build covariance models from sequence alignments</description> 2 <description>Build covariance models from sequence alignments</description>
3 <macros> 3 <macros>
4 <import>macros.xml</import> 4 <import>macros.xml</import>
5 </macros> 5 </macros>
6 <!--parallelism method="multi" split_inputs="alignment_infile" split_mode="to_size" split_size="10" merge_outputs="cmfile_outfile"></parallelism--> 6 <!--parallelism method="multi" split_inputs="alignment_infile" split_mode="to_size" split_size="10" merge_outputs="cmfile_outfile"></parallelism-->
7 <expand macro="xrefs"/>
7 <expand macro="requirements" /> 8 <expand macro="requirements" />
8 <expand macro="stdio" /> 9 <expand macro="stdio" />
9 <expand macro="xrefs"/>
10 <command> 10 <command>
11 <![CDATA[ 11 <![CDATA[
12 cmbuild 12 cmbuild
13 -F 13 -F
14 #if $is_summery_output: 14 #if $is_summery_output:
194 <param name="cyk" type="select" label="Options for refining the input alignment" help=""> 194 <param name="cyk" type="select" label="Options for refining the input alignment" help="">
195 <option value="" selected="true">optimal accuracy algorithm</option> 195 <option value="" selected="true">optimal accuracy algorithm</option>
196 <option value="--cyk">align with the CYK algorithm</option> 196 <option value="--cyk">align with the CYK algorithm</option>
197 </param> 197 </param>
198 198
199 <param name="refine_output" truevalue="" falsevalue="" checked="False" type="boolean" 199 <param name="refine_output" truevalue="--refine" falsevalue="" checked="False" type="boolean"
200 label="Output the refined alignment file as it is used to build the covariance model" help=""/> 200 label="Output the refined alignment file as it is used to build the covariance model" help=""/>
201 201
202 </when> 202 </when>
203 </conditional> 203 </conditional>
204 204
205 <param name="is_summery_output" truevalue="" falsevalue="" checked="False" type="boolean" 205 <param name="is_summery_output" truevalue="-o" falsevalue="" checked="False" type="boolean"
206 label="Output a summery file?" help=""/> 206 label="Output a summery file?" help=""/>
207 207
208 <!-- calibrate options --> 208 <!-- calibrate options -->
209 <conditional name="Calibrate"> 209 <conditional name="Calibrate">
210 <param name="selector" type="boolean" checked="true" label="Calibrate the covariance model" 210 <param name="selector" type="select" label="Calibrate the covariance model"
211 help="A CM file must be calibrated with cmcalibrate before it can be used in cmsearch or cmscan. cmcalibrate is very slow. It takes a couple of hours to calibrate a single average sized CM on a single CPU"/> 211 help="A CM file must be calibrated with cmcalibrate before it can be used in cmsearch or cmscan. cmcalibrate is very slow. It takes a couple of hours to calibrate a single average sized CM on a single CPU">
212 <option value="true">Yes</option>
213 <option value="false">No</option>
214 </param>
212 <when value="false"/> 215 <when value="false"/>
213 <when value="true"> 216 <when value="true">
214 <param argument="-L" type="float" value="1.6" min="0.01" max="160" label="Total length of random sequences to search" help="Set random seq length to search in Mb (megabases)"/> 217 <param argument="-L" type="float" value="1.6" min="0.01" max="160" label="Total length of random sequences to search" help="Set random seq length to search in Mb (megabases)"/>
215 <conditional name="cont_exp_tails_fits" > 218 <conditional name="cont_exp_tails_fits" >
216 <param name="selector" type="select" label="Options controlling exponential tail fits"> 219 <param name="selector" type="select" label="Options controlling exponential tail fits">
323 </data> 326 </data>
324 327
325 </outputs> 328 </outputs>
326 329
327 <tests> 330 <tests>
328 <test> 331 <test expect_num_outputs="1">
329 <param name="alignment_infile" value="cmbuild_input_tRNA5.sto"/> 332 <param name="alignment_infile" value="cmbuild_input_tRNA5.sto"/>
330 <conditional name="Calibrate"> 333 <conditional name="Calibrate">
331 <param name="selector" value="true"/> 334 <param name="selector" value="true"/>
332 <param name="L" value="0.1"/> 335 <param name="L" value="0.1"/>
333 </conditional> 336 </conditional>
336 <has_text text="S 0 -1 0 1 4 0 1 89 109 -7.220 -8.465 -0.063 -4.919"/> 339 <has_text text="S 0 -1 0 1 4 0 1 89 109 -7.220 -8.465 -0.063 -4.919"/>
337 </assert_contents> 340 </assert_contents>
338 </output> 341 </output>
339 </test> 342 </test>
340 <!-- Test emax seq parameter --> 343 <!-- Test emax seq parameter -->
341 <test> 344 <test expect_num_outputs="1">
342 <param name="alignment_infile" value="cmbuild_input_tRNA5.sto"/> 345 <param name="alignment_infile" value="cmbuild_input_tRNA5.sto"/>
343 <conditional name="Calibrate"> 346 <conditional name="Calibrate">
344 <param name="selector" value="true"/> 347 <param name="selector" value="true"/>
345 <param name="L" value="0.1"/> 348 <param name="L" value="0.1"/>
346 </conditional> 349 </conditional>
420 **Options controlling relative weights** 423 **Options controlling relative weights**
421 424
422 425
423 cmbuild uses an ad hoc sequence weighting algorithm to downweight closely related sequences and upweight distantly related ones. This has the effect of making models less biased by uneven phylogenetic representation. For example, two identical sequences would typically each receive half the weight that one sequence would. These options control which algorithm gets used. 426 cmbuild uses an ad hoc sequence weighting algorithm to downweight closely related sequences and upweight distantly related ones. This has the effect of making models less biased by uneven phylogenetic representation. For example, two identical sequences would typically each receive half the weight that one sequence would. These options control which algorithm gets used.
424 427
425 - *--wgb*: Use the Henikoff position-based sequence weighting scheme [Henikoff 428 - *--wgb*: Use the Henikoff position-based sequence weighting scheme [Henikoff and Henikoff, J. Mol. Biol. 243:574, 1994]. This is the default.
426 and Henikoff, J. Mol. Biol. 243:574, 1994]. This is the default.
427 - *--wgsc*: Use the Gerstein/Sonnhammer/Chothia weighting algorithm [Gerstein et al, J. Mol. Biol. 235:1067, 1994]. 429 - *--wgsc*: Use the Gerstein/Sonnhammer/Chothia weighting algorithm [Gerstein et al, J. Mol. Biol. 235:1067, 1994].
428 - *--wnone*: Turn sequence weighting off; e.g. explicitly set all sequence weights to 1.0. 430 - *--wnone*: Turn sequence weighting off; e.g. explicitly set all sequence weights to 1.0.
429 - *--wgiven*: Use sequence weights as given in annotation in the input alignment file. If no weights were given, assume they are all 1.0. The default is to determine new sequence weights by the Gerstein/Sonnhammer/Chothia algorithm, ignoring any annotated weights. 431 - *--wgiven*: Use sequence weights as given in annotation in the input alignment file. If no weights were given, assume they are all 1.0. The default is to determine new sequence weights by the Gerstein/Sonnhammer/Chothia algorithm, ignoring any annotated weights.
430 - *--wblosum*: Use the BLOSUM filtering algorithm to weight the sequences, instead of the default GSC weighting. Cluster the sequences at a given percentage identity (see --wid); assign each cluster a total weight of 1.0, distributed equally amongst the members of that cluster. 432 - *--wblosum*: Use the BLOSUM filtering algorithm to weight the sequences, instead of the default GSC weighting. Cluster the sequences at a given percentage identity (see --wid); assign each cluster a total weight of 1.0, distributed equally amongst the members of that cluster.
431 433