Mercurial > repos > galaxyp > percolator
view nested_collection.xml @ 5:dce55ca21b98 draft
planemo upload for repository https://github.com/galaxyproteomics/tools-galaxyp/tools/percolator commit 4fd46e83045d78a4703c0ae7d0cfc396bdbc8e78
author | galaxyp |
---|---|
date | Fri, 19 May 2017 09:01:27 -0400 |
parents | 154147805a33 |
children | 07107a686ce9 |
line wrap: on
line source
<tool id="batched_set_list_creator" name="Create nested list" version="3.3"> <description>based on filenames and batch sizes</description> <stdio> <exit_code range="1:" /> </stdio> <command>python $__tool_directory__/nested_collection.py #if $batchsize --batchsize $batchsize #end if #if len($poolids) > 0 --pool-ids #for $pool in $poolids '${pool.pool_identifier}' #end for #end if --real-names #for $fname in $listtobatch.keys() '$fname' #end for --galaxy-files #for $fname in $listtobatch.keys() '$listtobatch[$fname]' #end for </command> <inputs> <param name="batchsize" type="integer" optional="true" value="" label="Maximal amount of fractions to batch." help="No value means no maximum" /> <param name="filetype" type="select" label="Which datatype to nest?"> <option value="mzid">mzIdentML</option> <option value="percout">Percolator out</option> <option value="tabular">Tabular</option> </param> <repeat name="poolids" title="Batch pools" help="Pools containing batches (optional, not using this will result in one pool)"> <param name="pool_identifier" type="text" label="Filename part identifying batchpool" help="Specify part of the input filenames that are unique for each pool, e.g set_A. Do not use 3 consecutive underscores."/> </repeat> <param name="listtobatch" type="data_collection" collection_type="list" label="List of files to batch" /> </inputs> <outputs> <collection name="batched_fractions_mzid" type="list:list" label="Pooled batched mzIdentML data"> <filter>filetype == "mzid"</filter> <discover_datasets pattern="(?P<identifier_0>\w+[^_][^_][^_])___(?P<identifier_1>[\w.-]+)\.data" ext="mzid" visible="false" /> </collection> <collection name="batched_fractions_perco" type="list:list" label="Pooled batched percolator data"> <filter>filetype == "percout"</filter> <discover_datasets pattern="(?P<identifier_0>\w+[^_][^_][^_])___(?P<identifier_1>[\w.-]+)\.data" ext="percout" visible="false" /> </collection> <collection name="batched_fractions_tab" type="list:list" label="Pooled batched tabular data"> <filter>filetype == "tabular"</filter> <discover_datasets pattern="(?P<identifier_0>\w+[^_][^_][^_])___(?P<identifier_1>[\w.-]+)\.data" ext="tabular" visible="false" /> </collection> </outputs> <tests> <test> <param name="batchsize" value="6"/> <param name="filetype" value="mzid" /> <param name="listtobatch"> <collection type="list"> <element name="fraction_one_spectra.mzML" value="empty_file1.mzid"/> <element name="fraction_two_spectra" value="empty_file2.mzid"/> <element name="fraction_three_spectra" value="empty_file3.mzid"/> <element name="fraction_four_spectra" value="empty_file4.mzid"/> <element name="fraction_five_spectra" value="empty_file5.mzid"/> <element name="fraction_six_spectra" value="empty_file6.mzid"/> <element name="fraction_seven_spectra" value="empty_file7.mzid"/> <element name="fraction_eight_spectra" value="empty_file8.mzid"/> <element name="fraction_nine_spectra" value="empty_file9.mzid"/> <element name="fraction_ten_spectra" value="empty_file10.mzid"/> <element name="fraction_eleven_spectra" value="empty_file11.mzid"/> </collection> </param> <output_collection name="batched_fractions_mzid" type="list:list"> <element name="pool0_batch0"> <element name="inputfn00_fraction_one_spectra.mzML" ftype="mzid" file="empty_file1.mzid"/> <element name="inputfn01_fraction_two_spectra" ftype="mzid" file="empty_file2.mzid"/> <element name="inputfn02_fraction_three_spectra" ftype="mzid" file="empty_file3.mzid"/> <element name="inputfn03_fraction_four_spectra" ftype="mzid" file="empty_file4.mzid"/> <element name="inputfn04_fraction_five_spectra" ftype="mzid" file="empty_file5.mzid"/> <element name="inputfn05_fraction_six_spectra" ftype="mzid" file="empty_file6.mzid"/> </element> <element name="pool0_batch1"> <element name="inputfn06_fraction_seven_spectra" ftype="mzid" file="empty_file7.mzid"/> <element name="inputfn07_fraction_eight_spectra" ftype="mzid" file="empty_file8.mzid"/> <element name="inputfn08_fraction_nine_spectra" ftype="mzid" file="empty_file9.mzid"/> <element name="inputfn09_fraction_ten_spectra" ftype="mzid" file="empty_file10.mzid"/> <element name="inputfn10_fraction_eleven_spectra" ftype="mzid" file="empty_file10.mzid"/> </element> </output_collection> </test> <test> <repeat name="poolids"> <param name="pool_identifier" value="set1"/> </repeat> <repeat name="poolids"> <param name="pool_identifier" value="set2"/> </repeat> <param name="filetype" value="tabular" /> <param name="listtobatch"> <collection type="list"> <element name="fr_one_set1-spectra" value="empty_file1.mzid"/> <element name="fr_two_set1_spectra" value="empty_file2.mzid"/> <element name="fr_three_set1_spectra" value="empty_file3.mzid"/> <element name="fr_four_set1_spectra" value="empty_file4.mzid"/> <element name="fr_five_set1_spectra" value="empty_file5.mzid"/> <element name="fr_six_set1_spectra" value="empty_file6.mzid"/> <element name="fr_seven_set1_spectra" value="empty_file7.mzid"/> <element name="fr_eight_set1_spectra" value="empty_file8.mzid"/> <element name="fr_nine_set1_spectra" value="empty_file9.mzid"/> <element name="fr_ten_set1_spectra" value="empty_file10.mzid"/> <element name="fr_eleven_set1_spectra" value="empty_file11.mzid"/> <element name="fr_one_set2_spectra" value="empty_file12.mzid"/> <element name="fr_two_set2_spectra" value="empty_file13.mzid"/> <element name="fr_three_set2_spectra" value="empty_file14.mzid"/> </collection> </param> <output_collection name="batched_fractions_tab" type="list:list"> <element name="set1_batch0"> <element name="inputfn00_fr_one_set1-spectra" ftype="tabular" file="empty_file1.mzid"/> <element name="inputfn01_fr_two_set1_spectra" ftype="tabular" file="empty_file2.mzid"/> <element name="inputfn02_fr_three_set1_spectra" ftype="tabular" file="empty_file3.mzid"/> <element name="inputfn03_fr_four_set1_spectra" ftype="tabular" file="empty_file4.mzid"/> <element name="inputfn04_fr_five_set1_spectra" ftype="tabular" file="empty_file5.mzid"/> <element name="inputfn05_fr_six_set1_spectra" ftype="tabular" file="empty_file6.mzid"/> <element name="inputfn06_fr_seven_set1_spectra" ftype="tabular" file="empty_file7.mzid"/> <element name="inputfn07_fr_eight_set1_spectra" ftype="tabular" file="empty_file8.mzid"/> <element name="inputfn08_fr_nine_set1_spectra" ftype="tabular" file="empty_file9.mzid"/> <element name="inputfn09_fr_ten_set1_spectra" ftype="tabular" file="empty_file10.mzid"/> <element name="inputfn10_fr_eleven_set1_spectra" ftype="tabular" file="empty_file11.mzid"/> </element> <element name="set2_batch1"> <element name="inputfn0_fr_one_set2_spectra" ftype="tabular" file="empty_file12.mzid"/> <element name="inputfn1_fr_two_set2_spectra" ftype="tabular" file="empty_file13.mzid"/> <element name="inputfn2_fr_three_set2_spectra" ftype="tabular" file="empty_file14.mzid"/> </element> </output_collection> </test> <test> <param name="batchsize" value="2"/> <repeat name="poolids"> <param name="pool_identifier" value="set1"/> </repeat> <repeat name="poolids"> <param name="pool_identifier" value="set2"/> </repeat> <param name="filetype" value="percout" /> <param name="listtobatch"> <collection type="list"> <element name="fr_one_set1_spectra" value="empty_file1.mzid"/> <element name="fr_two_set1_spectra" value="empty_file2.mzid"/> <element name="fr_three_set1_spectra" value="empty_file3.mzid"/> <element name="fr_one_set2_spectra" value="empty_file4.mzid"/> <element name="fr_two_set2_spectra" value="empty_file5.mzid"/> <element name="fr_three_set2_spectra" value="empty_file6.mzid"/> </collection> </param> <output_collection name="batched_fractions_perco" type="list:list"> <element name="set1_batch0"> <element name="inputfn0_fr_one_set1_spectra" ftype="percout" file="empty_file1.mzid"/> <element name="inputfn1_fr_two_set1_spectra" ftype="percout" file="empty_file2.mzid"/> </element> <element name="set1_batch1"> <element name="inputfn2_fr_three_set1_spectra" ftype="percout" file="empty_file3.mzid"/> </element> <element name="set2_batch2"> <element name="inputfn0_fr_one_set2_spectra" ftype="percout" file="empty_file4.mzid"/> <element name="inputfn1_fr_two_set2_spectra" ftype="percout" file="empty_file5.mzid"/> </element> <element name="set2_batch3"> <element name="inputfn2_fr_three_set2_spectra" ftype="percout" file="empty_file6.mzid"/> </element> </output_collection> </test> </tests> <help> Creates nested collection containing from a list containing datasets in batches of a specific size. Useful when e.g. creating inputs to sqt2pin, msgfplus2pin or tandem2pin. Use this feature when you want to batch a specific amount of datasets, or datasets with a common file name pattern, or both. The tool generates a collection containing batches which contain multiple batches of input files. The pools are specified as a pattern in the input files which makes sure the batching isn't continued through very different input sets if that is a problem. Instead, for each filename-pattern it generates batches of the specified size. </help> </tool>