Mercurial > repos > galaxyp > openms_percolatoradapter

diff PercolatorAdapter.xml @ 9:02796e3ddec1 draft default tip
planemo upload for repository https://github.com/galaxyproteomics/tools-galaxyp/tree/master/tools/openms commit 5c080b1e2b99f1c88f4557e9fec8c45c9d23b906
author: galaxyp
date: Fri, 14 Jun 2024 21:34:28 +0000
parents: 016964c597f5
--- a/PercolatorAdapter.xml	Thu Dec 01 18:56:56 2022 +0000
+++ b/PercolatorAdapter.xml	Fri Jun 14 21:34:28 2024 +0000
@@ -1,8 +1,7 @@
-<?xml version='1.0' encoding='UTF-8'?>
 <!--This is a configuration file for the integration of a tool into Galaxy (https://galaxyproject.org/). This file was automatically generated using CTDConverter.-->
-<!--Proposed Tool Section: [ID Processing]-->
+<!--Proposed Tool Section: [Identification Processing]-->
 <tool id="PercolatorAdapter" name="PercolatorAdapter" version="@TOOL_VERSION@+galaxy@VERSION_SUFFIX@" profile="21.05">
-  <description>Facilitate input to Percolator and reintegrate.</description>
+  <description>Facilitate input to Percolator and reintegrate</description>
   <macros>
     <token name="@EXECUTABLE@">PercolatorAdapter</token>
     <import>macros.xml</import>
@@ -18,23 +17,23 @@
   mkdir in_cond.in &&
   #if $in_cond.in_select == "no"
   mkdir ${' '.join(["'in_cond.in/%s'" % (i) for i, f in enumerate($in_cond.in) if f])} && 
-  ${' '.join(["ln -s '%s' 'in_cond.in/%s/%s.%s' && " % (f, i, re.sub('[^\w\-_]', '_', f.element_identifier), $gxy2omsext(f.ext)) for i, f in enumerate($in_cond.in) if f])}
+  ${' '.join(["cp '%s' 'in_cond.in/%s/%s.%s' && " % (f, i, re.sub('[^\w\-_]', '_', f.element_identifier), $gxy2omsext(f.ext)) for i, f in enumerate($in_cond.in) if f])}
   #else
-  ln -s '$in_cond.in' 'in_cond.in/${re.sub("[^\w\-_]", "_", $in_cond.in.element_identifier)}.$gxy2omsext($in_cond.in.ext)' &&
+  cp '$in_cond.in' 'in_cond.in/${re.sub("[^\w\-_]", "_", $in_cond.in.element_identifier)}.$gxy2omsext($in_cond.in.ext)' &&
   #end if
 #end if
 #if $in_decoy_cond.in_decoy:
   mkdir in_decoy_cond.in_decoy &&
   #if $in_decoy_cond.in_decoy_select == "no"
   mkdir ${' '.join(["'in_decoy_cond.in_decoy/%s'" % (i) for i, f in enumerate($in_decoy_cond.in_decoy) if f])} && 
-  ${' '.join(["ln -s '%s' 'in_decoy_cond.in_decoy/%s/%s.%s' && " % (f, i, re.sub('[^\w\-_]', '_', f.element_identifier), $gxy2omsext(f.ext)) for i, f in enumerate($in_decoy_cond.in_decoy) if f])}
+  ${' '.join(["cp '%s' 'in_decoy_cond.in_decoy/%s/%s.%s' && " % (f, i, re.sub('[^\w\-_]', '_', f.element_identifier), $gxy2omsext(f.ext)) for i, f in enumerate($in_decoy_cond.in_decoy) if f])}
   #else
-  ln -s '$in_decoy_cond.in_decoy' 'in_decoy_cond.in_decoy/${re.sub("[^\w\-_]", "_", $in_decoy_cond.in_decoy.element_identifier)}.$gxy2omsext($in_decoy_cond.in_decoy.ext)' &&
+  cp '$in_decoy_cond.in_decoy' 'in_decoy_cond.in_decoy/${re.sub("[^\w\-_]", "_", $in_decoy_cond.in_decoy.element_identifier)}.$gxy2omsext($in_decoy_cond.in_decoy.ext)' &&
   #end if
 #end if
 #if $in_osw:
   mkdir in_osw &&
-  ln -s '$in_osw' 'in_osw/${re.sub("[^\w\-_]", "_", $in_osw.element_identifier)}.$gxy2omsext($in_osw.ext)' &&
+  cp '$in_osw' 'in_osw/${re.sub("[^\w\-_]", "_", $in_osw.element_identifier)}.$gxy2omsext($in_osw.ext)' &&
 #end if
 mkdir out &&
 #if "out_pin_FLAG" in str($OPTIONAL_OUTPUTS).split(',')
@@ -55,15 +54,17 @@
 #if "weights_FLAG" in str($OPTIONAL_OUTPUTS).split(',')
   mkdir weights &&
 #end if
+## advanced options
   #if $adv_opts.init_weights:
     mkdir adv_opts.init_weights &&
-    ln -s '$adv_opts.init_weights' 'adv_opts.init_weights/${re.sub("[^\w\-_]", "_", $adv_opts.init_weights.element_identifier)}.$gxy2omsext($adv_opts.init_weights.ext)' &&
+    cp '$adv_opts.init_weights' 'adv_opts.init_weights/${re.sub("[^\w\-_]", "_", $adv_opts.init_weights.element_identifier)}.$gxy2omsext($adv_opts.init_weights.ext)' &&
   #end if
   #if $adv_opts.fasta:
     mkdir adv_opts.fasta &&
-    ln -s '$adv_opts.fasta' 'adv_opts.fasta/${re.sub("[^\w\-_]", "_", $adv_opts.fasta.element_identifier)}.$gxy2omsext($adv_opts.fasta.ext)' &&
+    cp '$adv_opts.fasta' 'adv_opts.fasta/${re.sub("[^\w\-_]", "_", $adv_opts.fasta.element_identifier)}.$gxy2omsext($adv_opts.fasta.ext)' &&
   #end if
 
+
 ## Main program call
 
 set -o pipefail &&
@@ -116,6 +117,7 @@
   -weights
   'weights/output.${gxy2omsext("tabular")}'
 #end if
+## advanced options
   #if $adv_opts.init_weights:
     -init_weights
     'adv_opts.init_weights/${re.sub("[^\w\-_]", "_", $adv_opts.init_weights.element_identifier)}.$gxy2omsext($adv_opts.init_weights.ext)'
@@ -124,6 +126,7 @@
     -fasta
     'adv_opts.fasta/${re.sub("[^\w\-_]", "_", $adv_opts.fasta.element_identifier)}.$gxy2omsext($adv_opts.fasta.ext)'
   #end if
+
 #if len(str($OPTIONAL_OUTPUTS).split(',')) == 0
   | tee '$stdout'
 #end if
@@ -165,7 +168,7 @@
         <param argument="-in" type="data" format="idxml,mzid" multiple="true" optional="true" label="Input file(s)" help=" select idxml,mzid data sets(s)"/>
       </when>
       <when value="yes">
-        <param argument="-in" type="data" format="idxml,mzid" multiple="false" optional="true" label="Input file(s)" help=" select idxml,mzid data sets(s)"/>
+        <param argument="-in" type="data" format="idxml,mzid" optional="true" label="Input file(s)" help=" select idxml,mzid data sets(s)"/>
       </when>
     </conditional>
     <conditional name="in_decoy_cond">
@@ -177,17 +180,18 @@
         <param argument="-in_decoy" type="data" format="idxml,mzid" multiple="true" optional="true" label="Input decoy file(s) in case of separate searches" help=" select idxml,mzid data sets(s)"/>
       </when>
       <when value="yes">
-        <param argument="-in_decoy" type="data" format="idxml,mzid" multiple="false" optional="true" label="Input decoy file(s) in case of separate searches" help=" select idxml,mzid data sets(s)"/>
+        <param argument="-in_decoy" type="data" format="idxml,mzid" optional="true" label="Input decoy file(s) in case of separate searches" help=" select idxml,mzid data sets(s)"/>
       </when>
     </conditional>
     <param argument="-in_osw" type="data" format="osw" optional="true" label="Input file in OSW format" help=" select osw data sets(s)"/>
-    <param argument="-out_type" display="radio" type="select" optional="false" label="Output file type -- default: determined from file extension or content" help="">
+    <param argument="-out_type" type="select" label="Output file type -- default: determined from file extension or content" help="">
       <option value="idXML">idxml</option>
       <option value="mzid">mzid</option>
       <option value="osw">osw</option>
+      <validator type="expression" message="A value needs to be selected">value != "select a value"</validator>
       <expand macro="list_string_san" name="out_type"/>
     </param>
-    <param argument="-enzyme" type="select" optional="true" label="Type of enzyme: no_enzyme,elastase,pepsin,proteinasek,thermolysin,chymotrypsin,lys-n,lys-c,arg-c,asp-n,glu-c,trypsin,trypsinp" help="">
+    <param argument="-enzyme" type="select" label="Type of enzyme: no_enzyme,elastase,pepsin,proteinasek,thermolysin,chymotrypsin,lys-n,lys-c,arg-c,asp-n,glu-c,trypsin,trypsinp" help="">
       <option value="no_enzyme">no_enzyme</option>
       <option value="elastase">elastase</option>
       <option value="pepsin">pepsin</option>
@@ -205,13 +209,13 @@
     </param>
     <param argument="-peptide_level_fdrs" type="boolean" truevalue="true" falsevalue="false" checked="false" label="Calculate peptide-level FDRs instead of PSM-level FDRs" help=""/>
     <param argument="-protein_level_fdrs" type="boolean" truevalue="true" falsevalue="false" checked="false" label="Use the picked protein-level FDR to infer protein probabilities" help="Use the -fasta option and -decoy_pattern to set the Fasta file and decoy pattern"/>
-    <param argument="-osw_level" type="select" optional="true" label="OSW: the data level selected for scoring" help="">
+    <param argument="-osw_level" type="select" label="OSW: the data level selected for scoring" help="">
       <option value="ms1">ms1</option>
       <option value="ms2" selected="true">ms2</option>
       <option value="transition">transition</option>
       <expand macro="list_string_san" name="osw_level"/>
     </param>
-    <param argument="-score_type" type="select" optional="true" label="Type of the peptide main score" help="">
+    <param argument="-score_type" type="select" label="Type of the peptide main score" help="">
       <option value="q-value" selected="true">q-value</option>
       <option value="pep">pep</option>
       <option value="svm">svm</option>
@@ -219,37 +223,37 @@
     </param>
     <expand macro="adv_opts_macro">
       <param argument="-generic_feature_set" type="boolean" truevalue="true" falsevalue="false" checked="false" label="Use only generic" help="(i.e. not search engine specific) features. Generating search engine specific features for common search engines by PSMFeatureExtractor will typically boost the identification rate significantly"/>
-      <param argument="-subset_max_train" type="integer" optional="true" value="0" label="Only train an SVM on a subset of &lt;x&gt; PSMs, and use the resulting score vector to evaluate the other PSMs" help="Recommended when analyzing huge numbers (&gt;1 million) of PSMs. When set to 0, all PSMs are used for training as normal"/>
-      <param argument="-cpos" type="float" optional="true" value="0.0" label="Cpos, penalty for mistakes made on positive examples" help="Set by cross validation if not specified"/>
-      <param argument="-cneg" type="float" optional="true" value="0.0" label="Cneg, penalty for mistakes made on negative examples" help="Set by cross validation if not specified"/>
-      <param argument="-testFDR" type="float" optional="true" value="0.01" label="False discovery rate threshold for evaluating best cross validation result and the reported end result" help=""/>
-      <param argument="-trainFDR" type="float" optional="true" value="0.01" label="False discovery rate threshold to define positive examples in training" help="Set to testFDR if 0"/>
-      <param argument="-maxiter" type="integer" optional="true" value="10" label="Maximal number of iterations" help=""/>
-      <param argument="-nested_xval_bins" type="integer" optional="true" value="1" label="Number of nested cross-validation bins in the 3 splits" help=""/>
+      <param argument="-subset_max_train" type="integer" value="0" label="Only train an SVM on a subset of &lt;x&gt; PSMs, and use the resulting score vector to evaluate the other PSMs" help="Recommended when analyzing huge numbers (&gt;1 million) of PSMs. When set to 0, all PSMs are used for training as normal"/>
+      <param argument="-cpos" type="float" value="0.0" label="Cpos, penalty for mistakes made on positive examples" help="Set by cross validation if not specified"/>
+      <param argument="-cneg" type="float" value="0.0" label="Cneg, penalty for mistakes made on negative examples" help="Set by cross validation if not specified"/>
+      <param argument="-testFDR" type="float" value="0.01" label="False discovery rate threshold for evaluating best cross validation result and the reported end result" help=""/>
+      <param argument="-trainFDR" type="float" value="0.01" label="False discovery rate threshold to define positive examples in training" help="Set to testFDR if 0"/>
+      <param argument="-maxiter" type="integer" value="10" label="Maximal number of iterations" help=""/>
+      <param argument="-nested_xval_bins" type="integer" value="1" label="Number of nested cross-validation bins in the 3 splits" help=""/>
       <param argument="-quick_validation" type="boolean" truevalue="true" falsevalue="false" checked="false" label="Quicker execution by reduced internal cross-validation" help=""/>
       <param argument="-init_weights" type="data" format="tabular" optional="true" label="Read initial weights to the given file" help=" select tabular data sets(s)"/>
       <param argument="-static" type="boolean" truevalue="true" falsevalue="false" checked="false" label="Use static model (requires init-weights parameter to be set)" help=""/>
       <param argument="-default_direction" type="text" optional="true" value="" label="The most informative feature given as the feature name, can be negated to indicate that a lower value is bette" help="">
         <expand macro="list_string_san" name="default_direction"/>
       </param>
-      <param argument="-verbose" type="integer" optional="true" value="2" label="Set verbosity of output: 0=no processing info, 5=all" help=""/>
+      <param argument="-verbose" type="integer" value="2" label="Set verbosity of output: 0=no processing info, 5=all" help=""/>
       <param argument="-unitnorm" type="boolean" truevalue="true" falsevalue="false" checked="false" label="Use unit normalization [0-1] instead of standard deviation normalization" help=""/>
       <param argument="-test_each_iteration" type="boolean" truevalue="true" falsevalue="false" checked="false" label="Measure performance on test set each iteration" help=""/>
       <param argument="-override" type="boolean" truevalue="true" falsevalue="false" checked="false" label="Override error check and do not fall back on default score vector in case of suspect score vecto" help=""/>
-      <param argument="-seed" type="integer" optional="true" value="1" label="Setting seed of the random number generato" help=""/>
-      <param argument="-doc" type="integer" optional="true" value="0" label="Include description of correct features" help=""/>
+      <param argument="-seed" type="integer" value="1" label="Setting seed of the random number generato" help=""/>
+      <param argument="-doc" type="integer" value="0" label="Include description of correct features" help=""/>
       <param argument="-klammer" type="boolean" truevalue="true" falsevalue="false" checked="false" label="Retention time features calculated as in Klammer et al" help="Only available if -doc is set"/>
       <param argument="-fasta" type="data" format="fasta" optional="true" label="Provide the fasta file as the argument to this flag, which will be used for protein grouping based on an in-silico digest (only valid if option -protein_level_fdrs is active)" help=" select fasta data sets(s)"/>
-      <param argument="-decoy_pattern" type="text" optional="true" value="random" label="Define the text pattern to identify the decoy proteins and/or PSMs, set this up if the label that identifies the decoys in the database is not the default (Only valid if option -protein_level_fdrs is active)" help="">
+      <param argument="-decoy_pattern" type="text" value="random" label="Define the text pattern to identify the decoy proteins and/or PSMs, set this up if the label that identifies the decoys in the database is not the default (Only valid if option -protein_level_fdrs is active)" help="">
         <expand macro="list_string_san" name="decoy_pattern"/>
       </param>
       <param argument="-post_processing_tdc" type="boolean" truevalue="true" falsevalue="false" checked="false" label="Use target-decoy competition to assign q-values and PEPs" help=""/>
       <param argument="-train_best_positive" type="boolean" truevalue="true" falsevalue="false" checked="false" label="Enforce that, for each spectrum, at most one PSM is included in the positive set during each training iteration" help="If the user only provides one PSM per spectrum, this filter will have no effect"/>
-      <param argument="-ipf_max_peakgroup_pep" type="float" optional="true" value="0.7" label="OSW/IPF: Assess transitions only for candidate peak groups until maximum posterior error probability" help=""/>
-      <param argument="-ipf_max_transition_isotope_overlap" type="float" optional="true" value="0.5" label="OSW/IPF: Maximum isotope overlap to consider transitions in IPF" help=""/>
-      <param argument="-ipf_min_transition_sn" type="float" optional="true" value="0.0" label="OSW/IPF: Minimum log signal-to-noise level to consider transitions in IPF" help="Set -1 to disable this filter"/>
+      <param argument="-ipf_max_peakgroup_pep" type="float" value="0.7" label="OSW/IPF: Assess transitions only for candidate peak groups until maximum posterior error probability" help=""/>
+      <param argument="-ipf_max_transition_isotope_overlap" type="float" value="0.5" label="OSW/IPF: Maximum isotope overlap to consider transitions in IPF" help=""/>
+      <param argument="-ipf_min_transition_sn" type="float" value="0.0" label="OSW/IPF: Minimum log signal-to-noise level to consider transitions in IPF" help="Set -1 to disable this filter"/>
       <param argument="-force" type="boolean" truevalue="true" falsevalue="false" checked="false" label="Overrides tool-specific checks" help=""/>
-      <param argument="-test" type="hidden" optional="true" value="False" label="Enables the test mode (needed for internal use only)" help="">
+      <param argument="-test" type="hidden" value="False" label="Enables the test mode (needed for internal use only)" help="" optional="true">
         <expand macro="list_string_san" name="test"/>
       </param>
     </expand>
@@ -292,7 +296,8 @@
       <filter>OPTIONAL_OUTPUTS is not None and "ctd_out_FLAG" in OPTIONAL_OUTPUTS</filter>
     </data>
   </outputs>
-  <tests><!-- TOPP_PercolatorAdapter_1 -->
+  <tests>
+    <!-- TOPP_PercolatorAdapter_1 -->
     <test expect_num_outputs="2">
       <section name="adv_opts">
         <param name="generic_feature_set" value="false"/>
@@ -325,7 +330,7 @@
       <conditional name="in_cond">
         <param name="in" value="PercolatorAdapter_1.idXML"/>
       </conditional>
-      <output name="out" file="PercolatorAdapter_1_out.idXML" compare="sim_size" delta_frac="0.7" ftype="idxml"/>
+      <output name="out" value="PercolatorAdapter_1_out.idXML" compare="sim_size" delta_frac="0.7" ftype="idxml"/>
       <param name="out_type" value="idXML"/>
       <param name="enzyme" value="trypsin"/>
       <param name="peptide_level_fdrs" value="false"/>
@@ -338,6 +343,9 @@
           <is_valid_xml/>
         </assert_contents>
       </output>
+      <assert_stdout>
+        <has_text_matching expression="@EXECUTABLE@ took .* \(wall\), .* \(CPU\), .* \(system\), .* \(user\)(; Peak Memory Usage: 32 MB)?."/>
+      </assert_stdout>
     </test>
     <!-- TOPP_PercolatorAdapter_2 -->
     <test expect_num_outputs="2">
@@ -370,7 +378,7 @@
         <param name="test" value="true"/>
       </section>
       <param name="in_osw" value="PercolatorAdapter_2.osw"/>
-      <output name="out" file="PercolatorAdapter_2_out1.osw" compare="sim_size" delta_frac="0.7" ftype="osw"/>
+      <output name="out" value="PercolatorAdapter_2_out1.osw" compare="sim_size" delta_frac="0.7" ftype="osw"/>
       <param name="out_type" value="osw"/>
       <param name="enzyme" value="trypsin"/>
       <param name="peptide_level_fdrs" value="false"/>
@@ -383,6 +391,9 @@
           <is_valid_xml/>
         </assert_contents>
       </output>
+      <assert_stdout>
+        <has_text_matching expression="@EXECUTABLE@ took .* \(wall\), .* \(CPU\), .* \(system\), .* \(user\)(; Peak Memory Usage: 32 MB)?."/>
+      </assert_stdout>
     </test>
     <!-- TOPP_PercolatorAdapter_3 -->
     <test expect_num_outputs="2">
@@ -415,7 +426,7 @@
         <param name="test" value="true"/>
       </section>
       <param name="in_osw" value="PercolatorAdapter_2_out1.osw"/>
-      <output name="out" file="PercolatorAdapter_3_out1.osw" compare="sim_size" delta_frac="0.7" ftype="osw"/>
+      <output name="out" value="PercolatorAdapter_3_out1.osw" compare="sim_size" delta_frac="0.7" ftype="osw"/>
       <param name="out_type" value="osw"/>
       <param name="enzyme" value="trypsin"/>
       <param name="peptide_level_fdrs" value="false"/>
@@ -428,6 +439,9 @@
           <is_valid_xml/>
         </assert_contents>
       </output>
+      <assert_stdout>
+        <has_text_matching expression="@EXECUTABLE@ took .* \(wall\), .* \(CPU\), .* \(system\), .* \(user\)(; Peak Memory Usage: 32 MB)?."/>
+      </assert_stdout>
     </test>
     <!-- TOPP_PercolatorAdapter_4 -->
     <test expect_num_outputs="2">
@@ -460,7 +474,7 @@
         <param name="test" value="true"/>
       </section>
       <param name="in_osw" value="PercolatorAdapter_3_out1.osw"/>
-      <output name="out" file="PercolatorAdapter_4_out1.osw" compare="sim_size" delta_frac="0.7" ftype="osw"/>
+      <output name="out" value="PercolatorAdapter_4_out1.osw" compare="sim_size" delta_frac="0.7" ftype="osw"/>
       <param name="out_type" value="osw"/>
       <param name="enzyme" value="trypsin"/>
       <param name="peptide_level_fdrs" value="false"/>
@@ -473,6 +487,9 @@
           <is_valid_xml/>
         </assert_contents>
       </output>
+      <assert_stdout>
+        <has_text_matching expression="@EXECUTABLE@ took .* \(wall\), .* \(CPU\), .* \(system\), .* \(user\)(; Peak Memory Usage: 32 MB)?."/>
+      </assert_stdout>
     </test>
     <!-- TOPP_PercolatorAdapter_5 -->
     <test expect_num_outputs="3">
@@ -507,8 +524,8 @@
       <conditional name="in_cond">
         <param name="in" value="PercolatorAdapter_1.idXML"/>
       </conditional>
-      <output name="out" file="PercolatorAdapter_1_out.idXML" compare="sim_size" delta_frac="0.7" ftype="idxml"/>
-      <output name="out_pin" file="PercolatorAdapter_1_out1.tsv" compare="sim_size" delta_frac="0.7" ftype="tabular"/>
+      <output name="out" value="PercolatorAdapter_1_out.idXML" compare="sim_size" delta_frac="0.7" ftype="idxml"/>
+      <output name="out_pin" value="PercolatorAdapter_1_out1.tsv" compare="sim_size" delta_frac="0.7" ftype="tabular"/>
       <param name="out_type" value="idXML"/>
       <param name="enzyme" value="trypsin"/>
       <param name="peptide_level_fdrs" value="false"/>
@@ -521,11 +538,14 @@
           <is_valid_xml/>
         </assert_contents>
       </output>
+      <assert_stdout>
+        <has_text_matching expression="@EXECUTABLE@ took .* \(wall\), .* \(CPU\), .* \(system\), .* \(user\)(; Peak Memory Usage: 32 MB)?."/>
+      </assert_stdout>
     </test>
   </tests>
   <help><![CDATA[Facilitate input to Percolator and reintegrate.
 
 
-For more information, visit http://www.openms.de/doxygen/release/2.8.0/html/TOPP_PercolatorAdapter.html]]></help>
+For more information, visit https://openms.de/doxygen/release/3.1.0/html/TOPP_PercolatorAdapter.html]]></help>
   <expand macro="references"/>
 </tool>
author	galaxyp
date	Fri, 14 Jun 2024 21:34:28 +0000
parents	016964c597f5
children