changeset 11:618d74240c7f draft

Uploaded
author iracooke
date Mon, 16 Jun 2014 05:47:55 -0400
parents ffd1d25b8080
children f9271f6991b1
files README README.md repository_dependencies.xml tandem.xml tandem_to_pepxml.xml tool-data/pepxml_databases.loc.sample tool-data/tandem_mods.loc.sample
diffstat 7 files changed, 233 insertions(+), 31 deletions(-) [+]
line wrap: on
line diff
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/README	Mon Jun 16 05:47:55 2014 -0400
@@ -0,0 +1,6 @@
+Galaxy wrapper for running the X!Tandem search engine and converting results to pepXML
+
+Requirements:
+This package uses protk and the trans_proteomic_pipeline. These must be installed separately. 
+
+For instructions please see: https://github.com/iracooke/protk/#galaxy-integration
\ No newline at end of file
--- a/README.md	Mon Jun 16 05:47:38 2014 -0400
+++ /dev/null	Thu Jan 01 00:00:00 1970 +0000
@@ -1,6 +0,0 @@
-## What is it?
-Galaxy tool definition file and wrapper scripts for the [X!Tandem search engine](http://www.thegpm.org/tandem/index.html).
-
-## This tool requires that the protk rubygem and X!Tandem itself are installed.
-
-
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/repository_dependencies.xml	Mon Jun 16 05:47:55 2014 -0400
@@ -0,0 +1,4 @@
+<?xml version="1.0"?>
+<repositories description="Proteomics datatypes">
+    <repository changeset_revision="f66f8ca7b7b9" name="proteomics_datatypes" owner="iracooke" toolshed="http://toolshed.g2.bx.psu.edu" />
+ </repositories>
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/tandem.xml	Mon Jun 16 05:47:55 2014 -0400
@@ -0,0 +1,204 @@
+<tool id="proteomics_search_tandem_1" name="X!Tandem MSMS Search" version="1.0.2">
+
+   <requirements>
+	    <requirement type="package" version="1.3.0">protk</requirement>
+   </requirements>
+
+	<description>Run an X!Tandem Search</description>
+
+	<command>
+		#if $database.source_select=="built_in":
+		tandem_search.rb -d $database.dbkey 
+		#else 
+		tandem_search.rb -d $database.fasta_file
+		#end if
+
+		#if $tandem_params.source_select=="built_in":
+		-T $tandem_params.paramskey 
+		#else 
+		-T $tandem_params.params_file
+		#end if
+
+
+		--var-mods='
+		$variable_mods
+		#for $custom_variable_mod in $custom_variable_mods:
+		,${custom_variable_mod.custom_mod}
+		#end for
+		'
+
+		--fix-mods='
+		$fixed_mods
+		#for $custom_fix_mod in $custom_fix_mods:
+		,${custom_fix_mod.custom_mod}
+		#end for
+		'
+
+		$input_file -o $output -r 
+
+		--enzyme=$enzyme 
+
+		--precursor-ion-tol-units=$precursor_tolu 
+
+		-v $missed_cleavages 
+
+		-f $fragment_ion_tol 
+
+		-p $precursor_ion_tol 
+
+		$allow_multi_isotope_search 
+
+		$acetyl_protein_nterm
+
+		$cleavage_semi
+
+		$keep_spectra
+
+		--threads $threads
+		
+	</command>
+
+	<inputs>
+		<conditional name="database">
+			<param name="source_select" type="select" label="Database source">
+				<option value="built_in">Built-In</option>
+				<option value="input_ref" selected="true">Your Upload File</option>
+			</param>
+			<when value="built_in">
+				<param name="dbkey" type="select" format="text" >
+					<label>Database</label>
+					<options from_file="pepxml_databases.loc">
+						<column name="name" index="0" />
+						<column name="value" index="2" />
+					</options>
+				</param>
+			</when>
+			<when value="input_ref">
+				<param name="fasta_file" type="data" format="fasta" label="Uploaded FASTA file" />
+			</when>
+		</conditional>
+		
+		<conditional name="tandem_params">
+			<param name="source_select" type="select" label="Baseline Parameters">
+				<option value="built_in" selected="true">Built-In</option>
+				<option value="input_ref">Custom parameter file</option>
+			</param>
+			<when value="built_in">
+				<param name="paramskey" type="select" format="text" >
+					<label>Paramset</label>
+				    <option value="isb_native">ISB Native</option>		
+					<option value="isb_kscore">ISB K-Score</option>
+				</param>
+			</when>
+			<when value="input_ref">
+				<param name="params_file" type="data" format="xml" label="Custom X!Tandem Parameters" />
+			</when>
+		</conditional>
+
+		<param name="input_file" type="data" format="mzml,mgf" multiple="false" label="MSMS File" help="A file with MS/MS data"/>
+
+		<param name="variable_mods" format="text" type="select" multiple="true" label="Variable Modifications" help="Hold the appropriate key while
+			clicking to select multiple items">
+			<options from_file="tandem_mods.loc">
+				<column name="name" index="0" />
+				<column name="value" index="2" />
+			</options>
+		</param>
+
+		<repeat name="custom_variable_mods" title="Custom Variable Modifications" help="You can specify a modification when present in a motif. For instance, 0.998@N!{P}[ST] is a deamidation modification on N only if it is present in an N[any but P][S or T] motif (N-glycosite).">
+			<param name="custom_mod" type="text">
+			</param>
+		</repeat>
+		
+		
+		<param name="fixed_mods" format="text" type="select" multiple="true" label="Fixed Modifications" help="Hold the appropriate key while
+			clicking to select multiple items">
+			<options from_file="tandem_mods.loc">
+				<column name="name" index="0" />
+				<column name="value" index="2" />
+			</options>
+		</param>
+
+		<repeat name="custom_fix_mods" title="Custom Fixed Modifications" help="You can specify a modification when present in a motif. For instance, 0.998@N!{P}[ST] is a deamidation modification on N only if it is present in an N[any but P][S or T] motif (N-glycosite).">
+			<param name="custom_mod" type="text">
+			</param>
+		</repeat>
+
+		<param name="acetyl_protein_nterm" type="boolean" label="Allow N-terminal protein acetylation as a variable modification" truevalue="-y" falsevalue="" />		
+		
+
+		<param name="missed_cleavages" type="select" format="text" help="Allow peptides to contain up to this many missed enzyme cleavage sites">
+			<label>Missed Cleavages Allowed</label>
+		    <option value="0">0</option>		
+			<option value="1">1</option>
+			<option value="2">2</option>
+		</param>
+
+		<param name="cleavage_semi" type="boolean" label="Allow semi-cleaved peptides" help="This can increase search time dramatically" truevalue="--cleavage-semi" falsevalue=""/>
+
+		<param name="keep_spectra" type="boolean" label="Keep Spectra" help="Include spectra in the output" truevalue="--output-spectra" falsevalue=""/>
+
+		<param name="threads" type="integer" value="1" label="Threads" help="Number of threads to use for search. Maximum is 16"/>
+		
+		<param name="enzyme" type="select" format="text">
+		    <label>Enzyme</label>
+			<option value="[R]|{P}">argc - [R]|{P}</option>
+			<option value="[X]|[D]">aspn - [X]|[D]</option>
+			<option value="[FLMWY]|{P}">chymotrypsin - [FLMWY]|{P}</option>
+			<option value="[R]|[X]">clostripain - [R]|[X]</option>
+			<option value="[M]|{P}">cnbr - [M]|{P}</option>
+			<option value="[AGILV]|{P}">elastase - [AGILV]|{P}</option>
+			<option value="[D]|{P}">formicacid - [D]|{P}</option>
+			<option value="[DE]|{P}">gluc - [DE]|{P}</option>
+			<option value="[E]|{P}">gluc_bicarb - [E]|{P}</option>
+			<option value="[W]|[X]">iodosobenzoate - [W]|[X]</option>
+			<option value="[K]|{P}">lysc - [K]|{P}</option>
+			<option value="[K]|[X]">lysc-p - [K]|[X]</option>
+			<option value="[X]|[K]">lysn - [X]|[K]</option>
+			<option value="[X]|[AKRS]">lysn_promisc - [X]|[AKRS]</option>
+			<option value="[X]|[X]">nonspecific - [X]|[X]</option>
+			<option value="[FL]|[X]">pepsina - [FL]|[X]</option>
+			<option value="[P]|[X]">protein_endopeptidase - [P]|[X]</option>
+			<option value="[E]|[X]">staph_protease - [E]|[X]</option>
+			<option value="[FMWY]|{P},[KR]|{P},[X]|[D]">tca - [FMWY]|{P},[KR]|{P},[X]|[D]</option>
+			<option value="[KR]|{P}" selected="true">trypsin - [KR]|{P}</option>
+			<option value="[FKLMRWY]|{P}">trypsin/chymotrypsin - [FKLMRWY]|{P}</option>
+			<option value="[KR]|{P},[M]|{P}">trypsin/cnbr - [KR]|{P},[M]|{P}</option>
+			<option value="[DEKR]|{P}">trypsin_gluc - [DEKR]|{P}</option>
+		</param>
+
+		
+		<param name="fragment_ion_tol" help="Fragment Ion Tolerance in Daltons" type="float" value="0.65" min="0" max="10000" label="Fragment ion tolerance"/>
+
+		<param name="precursor_ion_tol" help="Precursor Ion Tolerance (Da or ppm)" type="float" value="100" min="0" max="10000" label="Precursor ion tolerance"/>
+		<param name="precursor_tolu" type="select" format="text">
+		    <label>Precursor Ion Tolerance Units</label>
+		    <option value="ppm">ppm</option>		
+			<option value="Da">Da</option>
+		</param>
+		
+		<param name="allow_multi_isotope_search" type="boolean" label="Allow multi-isotope search" help="This allows peptide candidates in windows around -1 Da and -2 Da from the acquired mass to be considered. Only applicable when the minus/plus window above is set to less than 0.5 Da. Good for accurate-mass instruments for which the reported precursor mass is not corrected to the monoisotopic mass." truevalue="" falsevalue=""/>
+
+	</inputs>
+
+
+	<outputs>
+		<data format="tandem" name="output" metadata_source="input_file" label="X!Tandem_vs_${database.dbkey if $database.has_key('dbkey') else $database.fasta_file.display_name}.${input_file.display_name}.${input_file.display_name}.tandem"/>
+	</outputs>
+
+
+  <help>
+
+**What it does**
+
+Runs an MS/MS database search using the X!Tandem search engine. Output is in the form of a pepXML file containing identified peptides along with their raw search scores.
+
+----
+
+**References**
+
+Please see http://www.thegpm.org/GPM/references.html for details of references describing the X!Tandem search engine.
+
+  </help>
+
+</tool>
--- a/tandem_to_pepxml.xml	Mon Jun 16 05:47:38 2014 -0400
+++ /dev/null	Thu Jan 01 00:00:00 1970 +0000
@@ -1,25 +0,0 @@
-<tool id="tandem_to_pepxml_1" name="Tandem to pepXML" version="1.0.1">
-	<requirements>
-	    <requirement type="package" version="1.3.0">protk</requirement>
-	    <requirement type="package" version="4.6.3">trans_proteomic_pipeline</requirement>
-   </requirements>
-
-  <description>Converts a tandem result file to pepXML</description>
-
-<command>
-	tandem_to_pepxml.rb $input_file -o $output 
-</command>
-
-<inputs>
-	<param name="input_file" type="data" format="tandem" multiple="false" label="Input File" help="X!Tandem results file"/>
-</inputs>
-
-<outputs>
-	<data format="raw_pepxml" metadata_source="input_file" name="output" label="${input_file.display_name}.pepXML" />
-</outputs>
-
-<help>
-	Convert X!Tandem results to pepXML
-</help>
-
-</tool>
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/tool-data/pepxml_databases.loc.sample	Mon Jun 16 05:47:55 2014 -0400
@@ -0,0 +1,13 @@
+#This file lists the names of protein databases installed locally in protk. 
+# These are used by omssa and x!tandem as well as the "mascot to pepxml" tool
+# In order to combine search results with Interprophet searches must be run against an identical database
+#
+# Entries should follow the be structured as follows
+# Display_name omssa_tandem_dbname dbkey
+#
+#
+Swissprot	spall_	spall	spall_
+Combined PlasmboDB (falciparum) and Swissprot Human	plasmodb_pfalciparum_sphuman_	plasmodb_pfalciparum_sphuman	plasmodb_pfalciparum_sphuman_
+Swissprot Human	sphuman_	sphuman	sphuman_
+Combined Swissprot/TRembl Human	sptrhuman_	sptrhuman	sptrhuman_
+Swissprot Mouse	spmouse_	spmouse	spmouse_
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/tool-data/tandem_mods.loc.sample	Mon Jun 16 05:47:55 2014 -0400
@@ -0,0 +1,6 @@
+#This file lists the names of inbuilt chemical modifications accepted by X!Tandem
+#
+#
+Carbamidomethyl C	carbamidomethyl_c_	57.021464@C	carbamidomethyl_c_
+Glycocapture-N	glycocapture_n_	0.998@N!{P}[ST]	glycocapture_n_
+Oxidation M	oxidation_m_	15.994915@M	oxidation_m_
\ No newline at end of file