Mercurial > repos > galaxyp > percolator
diff nested_collection.xml @ 1:86770eea5b09 draft
planemo upload for repository https://github.com/galaxyproteomics/tools-galaxyp/tools/percolator commit 0a5f9eb82877545be1c924357e585b17e01cfd1c
author | galaxyp |
---|---|
date | Sat, 04 Mar 2017 20:36:03 -0500 |
parents | |
children | 7a0951d0e13e |
line wrap: on
line diff
--- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/nested_collection.xml Sat Mar 04 20:36:03 2017 -0500 @@ -0,0 +1,137 @@ +<tool id="batched_set_list_creator" name="Create nested list" version="3.0.1"> + <description>based on filenames and batch sizes</description> + <stdio> + <exit_code range="1:" /> + </stdio> + <command>python $__tool_directory__/nested_collection.py + #if $batchsize + --batchsize $batchsize + #end if + #if len($poolids) > 0 + --pool-ids + #for $pool in $poolids + '${pool.pool_identifier}' + #end for + #end if + --real-names + #for $fname in $listtobatch.keys() + '$fname' + #end for + --galaxy-files + #for $fname in $listtobatch.keys() + '$listtobatch[$fname]' + #end for + </command> + <inputs> + <param name="batchsize" type="integer" optional="true" value="" label="Maximal amount of fractions to batch." help="No value means no maximum" /> + <repeat name="poolids" title="Batch pools" help="Pools containing batches (optional, not using this will result in one pool)"> + <param name="pool_identifier" type="text" label="Filename part identifying batchpool" + help="Specify part of the input filenames that are unique for each pool, e.g set_A. Do not use 3 consecutive underscores."/> + </repeat> + <param name="listtobatch" type="data_collection" collection_type="list" label="List of files to batch" /> + </inputs> + <outputs> + <collection name="batched_fractions" type="list:list" label="Pooled batched data"> + <discover_datasets pattern="[a-zA-z0-9_]*___(?P<identifier_0>[^_]+)_(?P<identifier_1>[^_]+)\.mzid" ext="mzid" visible="true" /> + </collection> + </outputs> + <tests> + <test> + <param name="batchsize" value="2"/> + <param name="listtobatch"> + <collection type="list"> + <element name="fraction_one_spectra" value="empty_file1.mzid"/> + <element name="fraction_two_spectra" value="empty_file2.mzid"/> + <element name="fraction_three_spectra" value="empty_file3.mzid"/> + <element name="fraction_four_spectra" value="empty_file4.mzid"/> + </collection> + </param> + <output_collection name="batched_fractions" type="list:list"> + <element name="batch0"> + <element name="inputfn0" file="empty_file1.mzid"/> + <element name="inputfn1" file="empty_file2.mzid"/> + </element> + <element name="batch1"> + <element name="inputfn0" file="empty_file3.mzid"/> + <element name="inputfn1" file="empty_file4.mzid"/> + </element> + </output_collection> + </test> + <test> + <repeat name="poolids"> + <param name="pool_identifier" value="set1"/> + </repeat> + <repeat name="poolids"> + <param name="pool_identifier" value="set2"/> + </repeat> + <param name="listtobatch"> + <collection type="list"> + <element name="fr_one_set1_spectra" value="empty_file1.mzid"/> + <element name="fr_two_set1_spectra" value="empty_file2.mzid"/> + <element name="fr_three_set1_spectra" value="empty_file3.mzid"/> + <element name="fr_one_set2_spectra" value="empty_file4.mzid"/> + <element name="fr_two_set2_spectra" value="empty_file5.mzid"/> + <element name="fr_three_set2_spectra" value="empty_file6.mzid"/> + </collection> + </param> + <output_collection name="batched_fractions" type="list:list"> + <element name="batch0"> + <element name="inputfn0" file="empty_file1.mzid"/> + <element name="inputfn1" file="empty_file2.mzid"/> + <element name="inputfn2" file="empty_file3.mzid"/> + </element> + <element name="batch1"> + <element name="inputfn0" file="empty_file4.mzid"/> + <element name="inputfn1" file="empty_file5.mzid"/> + <element name="inputfn2" file="empty_file6.mzid"/> + </element> + </output_collection> + </test> + <test> + <param name="batchsize" value="2"/> + <repeat name="poolids"> + <param name="pool_identifier" value="set1"/> + </repeat> + <repeat name="poolids"> + <param name="pool_identifier" value="set2"/> + </repeat> + <param name="listtobatch"> + <collection type="list"> + <element name="fr_one_set1_spectra" value="empty_file1.mzid"/> + <element name="fr_two_set1_spectra" value="empty_file2.mzid"/> + <element name="fr_three_set1_spectra" value="empty_file3.mzid"/> + <element name="fr_one_set2_spectra" value="empty_file4.mzid"/> + <element name="fr_two_set2_spectra" value="empty_file5.mzid"/> + <element name="fr_three_set2_spectra" value="empty_file6.mzid"/> + </collection> + </param> + <output_collection name="batched_fractions" type="list:list"> + <element name="batch0"> + <element name="inputfn0" file="empty_file1.mzid"/> + <element name="inputfn1" file="empty_file2.mzid"/> + </element> + <element name="batch1"> + <element name="inputfn0" file="empty_file3.mzid"/> + </element> + <element name="batch2"> + <element name="inputfn0" file="empty_file4.mzid"/> + <element name="inputfn1" file="empty_file5.mzid"/> + </element> + <element name="batch3"> + <element name="inputfn0" file="empty_file6.mzid"/> + </element> + </output_collection> + </test> + </tests> + <help> + Creates nested collection containing from a list containing datasets in batches of + a specific size. Useful when e.g. creating inputs to sqt2pin, msgfplus2pin or tandem2pin. + Use this feature when you want to batch a specific amount of datasets, or datasets with + a common file name pattern, or both. + The tool generates a collection containing batches which contain multiple batches + of input files. The pools are specified as a pattern in the input + files which makes sure the batching isn't continued through very different input sets + if that is a problem. Instead, for each filename-pattern it generates batches of the + specified size. + </help> +</tool>