# HG changeset patch # User galaxyp # Date 1371662144 14400 # Node ID 1183846e70a1c812ea212a994b7a5ac38739c40d # Parent 8fa16707e16275d5f88a618aab850ff23f0da6b3 Uploaded diff -r 8fa16707e162 -r 1183846e70a1 feature_linker_unlabeled.xml --- a/feature_linker_unlabeled.xml Fri May 10 17:31:59 2013 -0400 +++ b/feature_linker_unlabeled.xml Wed Jun 19 13:15:44 2013 -0400 @@ -1,4 +1,4 @@ - + Groups corresponding features from multiple maps. @@ -12,23 +12,31 @@ [simple_options] -in=$input1 +in=${",".join(map(str, $inputs))} out=$output +#if $type.input_type == "consensusxml" +$keep_subelements +#end if +$ignore_charge +$use_identifications +algorithm!second_nearest_gap=$second_nearest_gap +algorithm!distance_RT!max_difference=$rt_max_difference +algorithm!distance_MZ!max_difference=$mz_max_difference +algorithm!distance_MZ!unit=$mz_max_difference_unit +#if $advanced.specify +algorithm!distance_RT!weight=$advanced.rt_weight +algorithm!distance_MZ!weight=$advanced.mz_weight +algorithm!distance_intensity!weight=$advanced.intensity_weight +algorithm!distance_RT!exponent=$advanced.rt_exponent +algorithm!distance_MZ!exponent=$advanced.mz_exponent +algorithm!distance_intensity!exponent=$advanced.intensity_exponent +#end if - - - - - - - - - - - - + + + diff -r 8fa16707e162 -r 1183846e70a1 feature_linker_unlabeled_qt.xml --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/feature_linker_unlabeled_qt.xml Wed Jun 19 13:15:44 2013 -0400 @@ -0,0 +1,58 @@ + + + Groups corresponding features from multiple maps using a QT clustering approach. + + + macros.xml + + + + + openms_wrapper.py --executable 'FeatureLinkerUnlabeledQT' --config $config + + + [simple_options] +in=${",".join(map(str, $inputs))} +out=$output +#if $type.input_type == "consensusxml" +$keep_subelements +#end if +$ignore_charge +$use_identifications +algorithm!distance_RT!max_difference=$rt_max_difference +algorithm!distance_MZ!max_difference=$mz_max_difference +algorithm!distance_MZ!unit=$mz_max_difference_unit +#if $advanced.specify +algorithm!distance_RT!weight=$advanced.rt_weight +algorithm!distance_MZ!weight=$advanced.mz_weight +algorithm!distance_intensity!weight=$advanced.intensity_weight +algorithm!distance_RT!exponent=$advanced.rt_exponent +algorithm!distance_MZ!exponent=$advanced.mz_exponent +algorithm!distance_intensity!exponent=$advanced.intensity_exponent +#end if + + + + + + + + + + + +**What it does** + +This tool provides an algorithm for grouping corresponding features in multiple runs of label-free experiments. For more details and algorithm-specific parameters (set in the INI file) see "Detailed Description" in the algorithm documentation or the INI file table below. + +FeatureLinkerUnlabeled takes several feature maps (featureXML files) and stores the corresponding features in a consensus map (consensusXML file). Feature maps can be created from MS experiments (peak data) using one of the FeatureFinder TOPP tools. + +Advanced users can convert the consensusXML generated by this tool to EDTA using FileConverter and plot the distribution of distances in RT (or m/z) between different input files (can be done in Excel). The distribution should be Gaussian-like with very few points beyond the tails. Points far away from the Gaussian indicate a too wide tolerance. A Gaussian with its left/right tail trimmed indicates a too narrow tolerance. + +**Citation** + +For the underlying tool, please cite ``Weisser et al.: An automated pipeline for high-throughput label-free quantitative proteomics (J. Proteome Res., 2013, PMID: 23391308).`` + +If you use this tool in Galaxy, please cite Chilton J, et al. https://bitbucket.org/galaxyp/galaxyp-toolshed-openms + + diff -r 8fa16707e162 -r 1183846e70a1 id_file_converter.xml --- a/id_file_converter.xml Fri May 10 17:31:59 2013 -0400 +++ b/id_file_converter.xml Wed Jun 19 13:15:44 2013 -0400 @@ -13,7 +13,6 @@ [simple_options] in=${in} -in_type=${in.ext} out=${out} out_type=${output_type} @@ -21,18 +20,18 @@ - - + + - + - + - + diff -r 8fa16707e162 -r 1183846e70a1 idxml_to_tabular.xml --- a/idxml_to_tabular.xml Fri May 10 17:31:59 2013 -0400 +++ b/idxml_to_tabular.xml Wed Jun 19 13:15:44 2013 -0400 @@ -14,23 +14,18 @@ [simple_options] in=${in} out=${out} -#if $dump_type == "protein" -proteins_only=true -#end if -#if $dump_type == "pepetide" -peptides_only=true -#end if -$extra_rt +$dump_type +id!first_dim_rt=$extra_rt - - - + + + - + diff -r 8fa16707e162 -r 1183846e70a1 isobaric_analyzer.xml --- a/isobaric_analyzer.xml Fri May 10 17:31:59 2013 -0400 +++ b/isobaric_analyzer.xml Wed Jun 19 13:15:44 2013 -0400 @@ -1,4 +1,4 @@ - + Extracts and normalizes iTRAQ/TMT information from an MS experiment. diff -r 8fa16707e162 -r 1183846e70a1 macros.xml --- a/macros.xml Fri May 10 17:31:59 2013 -0400 +++ b/macros.xml Wed Jun 19 13:15:44 2013 -0400 @@ -80,4 +80,64 @@ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + \ No newline at end of file diff -r 8fa16707e162 -r 1183846e70a1 map_aligner_identification.xml --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/map_aligner_identification.xml Wed Jun 19 13:15:44 2013 -0400 @@ -0,0 +1,86 @@ + + + Corrects retention time distortions between maps based on common peptide identifications. + + + macros.xml + + + + + openms_wrapper.py --executable 'MapAlignerIdentification' --config $config + + + [simple_options] +#set $inputs_as_str = ",".join(map(str, $type.input)) +in=$inputs_as_str +out=@MULTI_OUTPUT($output.extra_files_path,$inputs_as_str)@ +#if $generate_transformations +trafo_out=@MULTI_OUTPUT($transformations.extra_files_path,$inputs_as_str)@ +#end if +algorithm!peptide_score_threshold=$peptide_score_threshold +algorithm!min_run_occur=$min_run_occur +algorithm!max_rt_shift=$max_rt_shift +algorithm!use_unassigned_peptides=$use_unassigned_peptides +algorithm!use_feature_rt=$use_feature_rt +#set $model_type = $model.model_type +model!type=$model_type +#if $model_type == "interpolated" +model!interpolated!interpolation_type=$model.interpolation_type +#end if + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + generate_transformations + + + +**What it does** + +This tool provides an algorithm to align the retention time scales of multiple input files, correcting shifts and distortions between them. Retention time adjustment may be necessary to correct for chromatography differences e.g. before data from multiple LC-MS runs can be combined (feature grouping), or when one run should be annotated with peptide identifications obtained in a different run. + +All map alignment tools (MapAligner...) collect retention time data from the input files and - by fitting a model to this data - compute transformations that map all runs to a common retention time scale. + +The map alignment tools differ in how they obtain retention time data for the modeling of transformations, and consequently what types of data they can be applied to. The alignment algorithm implemented here is based on peptide identifications, and thus applicable to files containing peptide IDs (idXML, annotated featureXML/consensusXML). It finds peptide sequences that different input files have in common and uses them as points of correspondence between the inputs. + +Note that alignment is based on the sequence including modifications, thus an exact match is required. I.e., a peptide with oxidised methionine will not be matched to its unmodified version. For some applications this behaviour is desired, while for others its not, but you can always remove all modifications from the input files if you want to ignore modifications. + +**Citation** + +For the underlying tool, please cite ``Weisser et al.: An automated pipeline for high-throughput label-free quantitative proteomics (J. Proteome Res., 2013, PMID: 23391308).`` + +If you use this tool in Galaxy, please cite Chilton J, et al. https://bitbucket.org/galaxyp/galaxyp-toolshed-openms + + diff -r 8fa16707e162 -r 1183846e70a1 map_aligner_spectrum.xml --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/map_aligner_spectrum.xml Wed Jun 19 13:15:44 2013 -0400 @@ -0,0 +1,64 @@ + + + Corrects retention time distortions between maps by aligning spectra. + + + macros.xml + + + + + openms_wrapper.py --executable 'MapAlignerSpectrum' --config $config + + + [simple_options] +#set $inputs_as_str = ",".join(map(str, $input)) +in=$inputs_as_str +out=@MULTI_OUTPUT($output.extra_files_path,$inputs_as_str)@ +#if $generate_transformations +trafo_out=@MULTI_OUTPUT($transformations.extra_files_path,$inputs_as_str)@ +#end if +algorithm!gapcost=$gapcost +algorithm!affinegapcost=$affinegapcost +algorithm!scorefunction=$scorefunction +#set $model_type = $model.model_type +model!type=$model_type +#if $model_type == "interpolated" +model!interpolated!interpolation_type=$model.interpolation_type +#end if + + + + + + + + + + + + + + + + + + generate_transformations + + + +**What it does** + +This tool provides an algorithm to align the retention time scales of multiple input files, correcting shifts and distortions between them. Retention time adjustment may be necessary to correct for chromatography differences e.g. before data from multiple LC-MS runs can be combined (feature grouping), or when one run should be annotated with peptide identifications obtained in a different run. + +All map alignment tools (MapAligner...) collect retention time data from the input files and - by fitting a model to this data - compute transformations that map all runs to a common retention time scale. They can apply the transformations right away and return output files with aligned time scales (parameter out), and/or return descriptions of the transformations in trafoXML format (parameter trafo_out). Transformations stored as trafoXML can be applied to arbitrary files with the MapRTTransformer tool. + +The map alignment tools differ in how they obtain retention time data for the modeling of transformations, and consequently what types of data they can be applied to. Here, an experimental algorithm based on spectrum alignment is implemented. It is only applicable to peak maps (mzML format). + +**Citation** + +For the underlying tool, please cite ``Weisser et al.: An automated pipeline for high-throughput label-free quantitative proteomics (J. Proteome Res., 2013, PMID: 23391308).`` + +If you use this tool in Galaxy, please cite Chilton J, et al. https://bitbucket.org/galaxyp/galaxyp-toolshed-openms + + diff -r 8fa16707e162 -r 1183846e70a1 omssa_adapter.xml --- a/omssa_adapter.xml Fri May 10 17:31:59 2013 -0400 +++ b/omssa_adapter.xml Wed Jun 19 13:15:44 2013 -0400 @@ -7,7 +7,7 @@ omssa - + blast+ openms_wrapper.py diff -r 8fa16707e162 -r 1183846e70a1 openms_wrapper.py --- a/openms_wrapper.py Fri May 10 17:31:59 2013 -0400 +++ b/openms_wrapper.py Wed Jun 19 13:15:44 2013 -0400 @@ -71,10 +71,10 @@ required: _fail("Failed to find specific OpenMS option [%s] in node [%s]" % (key, node)) else: - if not node: + if node is None: _fail("Failed to find specific OpenMS option [%s] in node [%s]" % (key, node)) sub_node = node.find("./NODE[@name='%s']" % key) - if not sub_node: + if sub_node is None: _fail("Failed to find node for key %s" % key) _set_option(sub_node, key_parts[1:], value, required) @@ -145,8 +145,16 @@ return None +def _mapped_outputs(output_directory, inputs): + inputs = inputs.split(",") + os.makedirs(output_directory) + outputs = [os.path.join(output_directory, os.path.basename(input)) for input in inputs] + return ",".join(outputs) + + VALUE_FUNCTIONS = {compile(r"\@WHICH$(.*)$\@"): _which, compile(r"\@PEPNOVO_MODELS_PATH\@"): _get_pepnovo_models_path, + compile(r"\@MULTI_OUTPUT$([^,]*),(.*)$\@"): _mapped_outputs, } diff -r 8fa16707e162 -r 1183846e70a1 peptide_indexer.xml --- a/peptide_indexer.xml Fri May 10 17:31:59 2013 -0400 +++ b/peptide_indexer.xml Wed Jun 19 13:15:44 2013 -0400 @@ -16,9 +16,7 @@ fasta=$database out=$output decoy_string=$decoy_string -#if $decoy_string_position == "prefix" -prefix=true -#end if +prefix=$prefix $extact_search $write_protein_sequence $keep_unreferenced_proteins @@ -29,9 +27,9 @@ - - - + + + diff -r 8fa16707e162 -r 1183846e70a1 protein_inference.xml --- a/protein_inference.xml Fri May 10 17:31:59 2013 -0400 +++ b/protein_inference.xml Wed Jun 19 13:15:44 2013 -0400 @@ -8,7 +8,7 @@ - openms_wrapper.py --executable 'PeptideIndexer' --config $config + openms_wrapper.py --executable 'ProteinInference' --config $config [simple_options] diff -r 8fa16707e162 -r 1183846e70a1 protein_quantifier.xml --- a/protein_quantifier.xml Fri May 10 17:31:59 2013 -0400 +++ b/protein_quantifier.xml Wed Jun 19 13:15:44 2013 -0400 @@ -23,7 +23,18 @@ - + + + + + + + + + + + + @@ -32,7 +43,7 @@ - + diff -r 8fa16707e162 -r 1183846e70a1 silac_analyzer.xml --- a/silac_analyzer.xml Fri May 10 17:31:59 2013 -0400 +++ b/silac_analyzer.xml Wed Jun 19 13:15:44 2013 -0400 @@ -27,7 +27,6 @@ - @@ -46,17 +45,6 @@ -