annotate quantifere.xml @ 28:6107b74eeb11 default tip

improved documentation
author pieter.lukasse@wur.nl
date Fri, 30 Jan 2015 14:53:10 +0100
parents 5215b5cfdc53
children
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
17
40ec8770780d * Added support for pepxml (and more specifically for
pieter.lukasse@wur.nl
parents: 6
diff changeset
1 <tool name="Quantifere" id="quantifere1" version="1.0.3">
0
d50f079096ee Push to main toolshed
pieter.lukasse@wur.nl
parents:
diff changeset
2 <description>Protein Inference by Peptide Quantification patterns</description>
d50f079096ee Push to main toolshed
pieter.lukasse@wur.nl
parents:
diff changeset
3 <!--
d50f079096ee Push to main toolshed
pieter.lukasse@wur.nl
parents:
diff changeset
4 For remote debugging start you listener on port 8000 and use the following as command interpreter:
d50f079096ee Push to main toolshed
pieter.lukasse@wur.nl
parents:
diff changeset
5 java -jar -Xdebug -Xrunjdwp:transport=dt_socket,address=D0100564.wurnet.nl:8000
d50f079096ee Push to main toolshed
pieter.lukasse@wur.nl
parents:
diff changeset
6 //////////////////////////
d50f079096ee Push to main toolshed
pieter.lukasse@wur.nl
parents:
diff changeset
7 -->
d50f079096ee Push to main toolshed
pieter.lukasse@wur.nl
parents:
diff changeset
8 <command interpreter="java -jar ">
d50f079096ee Push to main toolshed
pieter.lukasse@wur.nl
parents:
diff changeset
9 Quantifere.jar
d50f079096ee Push to main toolshed
pieter.lukasse@wur.nl
parents:
diff changeset
10 -annotatedQuantificationFilesList $annotatedQuantificationFilesList
d50f079096ee Push to main toolshed
pieter.lukasse@wur.nl
parents:
diff changeset
11 -identificationFilesList $identificationFilesList
d50f079096ee Push to main toolshed
pieter.lukasse@wur.nl
parents:
diff changeset
12 -statisticalMeasuresConfigFile $statisticalMeasuresConfigFile
d50f079096ee Push to main toolshed
pieter.lukasse@wur.nl
parents:
diff changeset
13 -quantificationDataToUse $quantificationDataToUse
d50f079096ee Push to main toolshed
pieter.lukasse@wur.nl
parents:
diff changeset
14 -minCorrel $minCorrel
d50f079096ee Push to main toolshed
pieter.lukasse@wur.nl
parents:
diff changeset
15 -minProtCoverage $minProtCoverage
d50f079096ee Push to main toolshed
pieter.lukasse@wur.nl
parents:
diff changeset
16 -minAboveAverageHits $minAboveAverageHits
d50f079096ee Push to main toolshed
pieter.lukasse@wur.nl
parents:
diff changeset
17 -minNrIdsForInferencePeptide $minNrIdsForInferencePeptide
d50f079096ee Push to main toolshed
pieter.lukasse@wur.nl
parents:
diff changeset
18 -refineModel $refineModel
d50f079096ee Push to main toolshed
pieter.lukasse@wur.nl
parents:
diff changeset
19 -functionalAnnotationCSV $functionalAnnotationCSV
d50f079096ee Push to main toolshed
pieter.lukasse@wur.nl
parents:
diff changeset
20 -outputCSV $outputCSV
d50f079096ee Push to main toolshed
pieter.lukasse@wur.nl
parents:
diff changeset
21 -outputInferenceLogCSV $outputInferenceLogCSV
d50f079096ee Push to main toolshed
pieter.lukasse@wur.nl
parents:
diff changeset
22 -outputSummaryAnnotationCSV $outputSummaryAnnotationCSV
d50f079096ee Push to main toolshed
pieter.lukasse@wur.nl
parents:
diff changeset
23 -outReport $htmlReportFile
d50f079096ee Push to main toolshed
pieter.lukasse@wur.nl
parents:
diff changeset
24 -outReportPicturesPath $htmlReportFile.files_path
d50f079096ee Push to main toolshed
pieter.lukasse@wur.nl
parents:
diff changeset
25 #if $is2D_LC_MS.fractions == True
d50f079096ee Push to main toolshed
pieter.lukasse@wur.nl
parents:
diff changeset
26 -namingConventionCodesForFractions $is2D_LC_MS.namingConventionCodesForFractions
d50f079096ee Push to main toolshed
pieter.lukasse@wur.nl
parents:
diff changeset
27 #end if
d50f079096ee Push to main toolshed
pieter.lukasse@wur.nl
parents:
diff changeset
28 </command>
d50f079096ee Push to main toolshed
pieter.lukasse@wur.nl
parents:
diff changeset
29
d50f079096ee Push to main toolshed
pieter.lukasse@wur.nl
parents:
diff changeset
30 <inputs>
d50f079096ee Push to main toolshed
pieter.lukasse@wur.nl
parents:
diff changeset
31
d50f079096ee Push to main toolshed
pieter.lukasse@wur.nl
parents:
diff changeset
32 <repeat name="annotatedQuantificationFiles" title="Peptide (filtered) quantification files (APML)"
d50f079096ee Push to main toolshed
pieter.lukasse@wur.nl
parents:
diff changeset
33 help="The APML contents as aligned, annotated and scored feature lists,
d50f079096ee Push to main toolshed
pieter.lukasse@wur.nl
parents:
diff changeset
34 as produced by MsFilt tool. Select one or more files. For 2D-LC-MS we expect one file per fraction.">
d50f079096ee Push to main toolshed
pieter.lukasse@wur.nl
parents:
diff changeset
35 <param name="annotatedQuantificationFile" size="50" type="data" format="apml" label="File (APML format)" />
d50f079096ee Push to main toolshed
pieter.lukasse@wur.nl
parents:
diff changeset
36 </repeat>
d50f079096ee Push to main toolshed
pieter.lukasse@wur.nl
parents:
diff changeset
37
d50f079096ee Push to main toolshed
pieter.lukasse@wur.nl
parents:
diff changeset
38 <repeat name="identificationFiles" title="Peptide (filtered) identification files (MS/MS identifications)"
d50f079096ee Push to main toolshed
pieter.lukasse@wur.nl
parents:
diff changeset
39 help="Full set of MS/MS peptide identification files, including peptides that could not be quantified.
d50f079096ee Push to main toolshed
pieter.lukasse@wur.nl
parents:
diff changeset
40 This set of identifications is ideally filtered on some quality and
d50f079096ee Push to main toolshed
pieter.lukasse@wur.nl
parents:
diff changeset
41 statistical measures (e.g. as is done by MsFilt). Tip: to base the inference only on the
d50f079096ee Push to main toolshed
pieter.lukasse@wur.nl
parents:
diff changeset
42 selected peptide quantification files, you
d50f079096ee Push to main toolshed
pieter.lukasse@wur.nl
parents:
diff changeset
43 can select the same quantification files here as well. Select one or more files.">
d50f079096ee Push to main toolshed
pieter.lukasse@wur.nl
parents:
diff changeset
44 <param name="identificationFile" size="50" type="data" format="apml,mzid" label="File (APML or MZIDENTML format)" />
d50f079096ee Push to main toolshed
pieter.lukasse@wur.nl
parents:
diff changeset
45 </repeat>
d50f079096ee Push to main toolshed
pieter.lukasse@wur.nl
parents:
diff changeset
46
d50f079096ee Push to main toolshed
pieter.lukasse@wur.nl
parents:
diff changeset
47 <conditional name="is2D_LC_MS">
d50f079096ee Push to main toolshed
pieter.lukasse@wur.nl
parents:
diff changeset
48 <param name="fractions" type="boolean" truevalue="Yes" falsevalue="No" checked="false"
d50f079096ee Push to main toolshed
pieter.lukasse@wur.nl
parents:
diff changeset
49 label="Data is from 2D LC-MS"
d50f079096ee Push to main toolshed
pieter.lukasse@wur.nl
parents:
diff changeset
50 help="Data acquisition was done in multiple fractions."/>
d50f079096ee Push to main toolshed
pieter.lukasse@wur.nl
parents:
diff changeset
51 <when value="Yes">
d50f079096ee Push to main toolshed
pieter.lukasse@wur.nl
parents:
diff changeset
52 <param name="namingConventionCodesForFractions" type="text" size="100" value=""
d50f079096ee Push to main toolshed
pieter.lukasse@wur.nl
parents:
diff changeset
53 label="Part of run/file name that identifies the 2D LC-MS fraction"
d50f079096ee Push to main toolshed
pieter.lukasse@wur.nl
parents:
diff changeset
54 help="Add the CSV list of codes that occur in the file names
d50f079096ee Push to main toolshed
pieter.lukasse@wur.nl
parents:
diff changeset
55 and that stand for a fraction code. E.g. '_F1,_F2,_F3,etc.' In this
d50f079096ee Push to main toolshed
pieter.lukasse@wur.nl
parents:
diff changeset
56 way different peptide identifications from the same sample but measured
d50f079096ee Push to main toolshed
pieter.lukasse@wur.nl
parents:
diff changeset
57 in different fractions can be merged together. Otherwise each (fraction) file
d50f079096ee Push to main toolshed
pieter.lukasse@wur.nl
parents:
diff changeset
58 is seen as a separate sample."/> <!-- could do regular expressions as well but this would be hard for biologists, e.g. _F\d\b -->
19
d31c6978d9d0 fixes for NapQ
pieter.lukasse@wur.nl
parents: 17
diff changeset
59 <!-- on help above: the given codes are removed from source name...separate features are clustered, not peptides, peptides
d31c6978d9d0 fixes for NapQ
pieter.lukasse@wur.nl
parents: 17
diff changeset
60 are quantified based on summing features (raw), or summing patterns : TODO document the quantification columns present in the output CSV -->
0
d50f079096ee Push to main toolshed
pieter.lukasse@wur.nl
parents:
diff changeset
61 </when>
6
d1edc7971d48 fixes in tool forms (<when> tags)
pieter.lukasse@wur.nl
parents: 4
diff changeset
62 <when value="No">
d1edc7971d48 fixes in tool forms (<when> tags)
pieter.lukasse@wur.nl
parents: 4
diff changeset
63 </when>
0
d50f079096ee Push to main toolshed
pieter.lukasse@wur.nl
parents:
diff changeset
64 </conditional>
d50f079096ee Push to main toolshed
pieter.lukasse@wur.nl
parents:
diff changeset
65
17
40ec8770780d * Added support for pepxml (and more specifically for
pieter.lukasse@wur.nl
parents: 6
diff changeset
66 <param name="statisticalMeasuresConfig" type="text" area="true" size="8x70" label="Statistical measures configuration"
0
d50f079096ee Push to main toolshed
pieter.lukasse@wur.nl
parents:
diff changeset
67 help="Here you may specify the statistical measures that are found in the ms/ms results (e.g. p or e-values).
d50f079096ee Push to main toolshed
pieter.lukasse@wur.nl
parents:
diff changeset
68 The format is: SM alias => SM name,type,mode[min/max]. Leaving this configuration out while these are present in the
d50f079096ee Push to main toolshed
pieter.lukasse@wur.nl
parents:
diff changeset
69 dataset will have the effect that they will be wrongly used as a regular scoring scheme, having effect on for example
d50f079096ee Push to main toolshed
pieter.lukasse@wur.nl
parents:
diff changeset
70 the filter criteria below like 'Minimum number of peptide matches with a score above average' ."
d50f079096ee Push to main toolshed
pieter.lukasse@wur.nl
parents:
diff changeset
71 value="smXTD =&gt; MS:1001330,XSLASH!Tandem:expect,min
d50f079096ee Push to main toolshed
pieter.lukasse@wur.nl
parents:
diff changeset
72 &#xd;&#xa;pvCSVEX =&gt; p_value,CSV_EXPORT,min
d50f079096ee Push to main toolshed
pieter.lukasse@wur.nl
parents:
diff changeset
73 &#xd;&#xa;smAUTO_LIKELIHOOD =&gt; AUTOMOD_LOGLIKELIHOOD,PLGS/Auto-mod,max
d50f079096ee Push to main toolshed
pieter.lukasse@wur.nl
parents:
diff changeset
74 &#xd;&#xa;smLIKELIHOOD =&gt; LOGLIKELIHOOD,PLGS/Databank-search,max
17
40ec8770780d * Added support for pepxml (and more specifically for
pieter.lukasse@wur.nl
parents: 6
diff changeset
75 &#xd;&#xa;smPercoProb =&gt; Percolator: probability,Percolator probability,max
40ec8770780d * Added support for pepxml (and more specifically for
pieter.lukasse@wur.nl
parents: 6
diff changeset
76 &#xd;&#xa;smPercoPEP =&gt; Percolator: PEP,Percolator PEP,min
40ec8770780d * Added support for pepxml (and more specifically for
pieter.lukasse@wur.nl
parents: 6
diff changeset
77 &#xd;&#xa;smPercoQval =&gt; Percolator: q-Value,Percolator q-Value,max
0
d50f079096ee Push to main toolshed
pieter.lukasse@wur.nl
parents:
diff changeset
78 "/>
d50f079096ee Push to main toolshed
pieter.lukasse@wur.nl
parents:
diff changeset
79 <!-- keep value attribute above aligned like this to avoid white spaces in the value -->
d50f079096ee Push to main toolshed
pieter.lukasse@wur.nl
parents:
diff changeset
80 <param name="quantificationDataToUse" type="select"
d50f079096ee Push to main toolshed
pieter.lukasse@wur.nl
parents:
diff changeset
81 label="Quantification data to use"
d50f079096ee Push to main toolshed
pieter.lukasse@wur.nl
parents:
diff changeset
82 help="Quantification data to use for the pattern clustering and inference steps. NB: check if the chosen data is also
d50f079096ee Push to main toolshed
pieter.lukasse@wur.nl
parents:
diff changeset
83 present in your file, or choose 'auto' to let Quantifere check which quantification type is present in most peptides.">
d50f079096ee Push to main toolshed
pieter.lukasse@wur.nl
parents:
diff changeset
84 <option value="auto" selected="true">auto</option>
d50f079096ee Push to main toolshed
pieter.lukasse@wur.nl
parents:
diff changeset
85 <option value="getIntensity">(TODO)raw intensities</option>
d50f079096ee Push to main toolshed
pieter.lukasse@wur.nl
parents:
diff changeset
86 <option value="getApexIntensity">(TODO)apex intensities</option>
d50f079096ee Push to main toolshed
pieter.lukasse@wur.nl
parents:
diff changeset
87 <option value="getNormalizedIntensity">(TODO)normalized intensities</option>
d50f079096ee Push to main toolshed
pieter.lukasse@wur.nl
parents:
diff changeset
88 </param>
d50f079096ee Push to main toolshed
pieter.lukasse@wur.nl
parents:
diff changeset
89 <!-- TODO let minCorrel default value vary according to quantification type chosen above -->
d50f079096ee Push to main toolshed
pieter.lukasse@wur.nl
parents:
diff changeset
90 <param name="minCorrel" type="float" size="10" value="0.85" label="Minimum correlation in a cluster" help="Features will be grouped by their protein annotation and
d50f079096ee Push to main toolshed
pieter.lukasse@wur.nl
parents:
diff changeset
91 sample intensity values correlation. Set here the minimum correlation expected between grouped members. This is used to guide the clustering algorithm."/>
d50f079096ee Push to main toolshed
pieter.lukasse@wur.nl
parents:
diff changeset
92
d50f079096ee Push to main toolshed
pieter.lukasse@wur.nl
parents:
diff changeset
93 <!-- simple extra heuristics to remove some "noise" protein hits -->
19
d31c6978d9d0 fixes for NapQ
pieter.lukasse@wur.nl
parents: 17
diff changeset
94 <param name="minProtCoverage" type="float" size="10" value="0.0" label="Minimum protein coverage (%)" help="Set this to e.g. 5.0 if you have protein coverage
d31c6978d9d0 fixes for NapQ
pieter.lukasse@wur.nl
parents: 17
diff changeset
95 information in your data. This will remove proteins that have a too small portion of their sequence covered by peptide matches."/>
d31c6978d9d0 fixes for NapQ
pieter.lukasse@wur.nl
parents: 17
diff changeset
96 <!-- TODO : ADD warning to report if this is left 0 and no coverage is found ...or maybe validate the other way around-->
0
d50f079096ee Push to main toolshed
pieter.lukasse@wur.nl
parents:
diff changeset
97
d50f079096ee Push to main toolshed
pieter.lukasse@wur.nl
parents:
diff changeset
98 <param name="minAboveAverageHits" type="integer" size="10" value="1" label="Minimum number of different peptide matches with a score above average"
d50f079096ee Push to main toolshed
pieter.lukasse@wur.nl
parents:
diff changeset
99 help="This will remove proteins that do not have enough reasonable peptides hits."/>
d50f079096ee Push to main toolshed
pieter.lukasse@wur.nl
parents:
diff changeset
100
d50f079096ee Push to main toolshed
pieter.lukasse@wur.nl
parents:
diff changeset
101 <param name="minNrIdsForInferencePeptide" type="integer" size="10" value="1" label="Minimum number of peptide identifications for inference peptides"
d50f079096ee Push to main toolshed
pieter.lukasse@wur.nl
parents:
diff changeset
102 help="Minimum number of peptide identifications a peptide needs to be used as inference peptide for secondary proteins."/>
19
d31c6978d9d0 fixes for NapQ
pieter.lukasse@wur.nl
parents: 17
diff changeset
103 <!-- currently, when one feature clusters with foreign peptide, then it is not inference peptide anymore...quite strict, could be less strict
d31c6978d9d0 fixes for NapQ
pieter.lukasse@wur.nl
parents: 17
diff changeset
104 by letting user indicate for example: 90% of features should be inference features...then it is an inference pep. See QuantifereTool.inferSecondaryProteins() -->
0
d50f079096ee Push to main toolshed
pieter.lukasse@wur.nl
parents:
diff changeset
105
d50f079096ee Push to main toolshed
pieter.lukasse@wur.nl
parents:
diff changeset
106 <param name="functionalAnnotationCSV" type="data" format="csv,txt,tsv" optional="true"
d50f079096ee Push to main toolshed
pieter.lukasse@wur.nl
parents:
diff changeset
107 label="(Functional)annotation mapping file (csv or tsv format)"
d50f079096ee Push to main toolshed
pieter.lukasse@wur.nl
parents:
diff changeset
108 help="Optional file that maps protein accessions to a network, pathway or other higher level annotations. In this file a header line is expected with these 2 columns (names and lower case is important): accession,annotation"/>
d50f079096ee Push to main toolshed
pieter.lukasse@wur.nl
parents:
diff changeset
109
d50f079096ee Push to main toolshed
pieter.lukasse@wur.nl
parents:
diff changeset
110 <param name="refineModel" type="boolean" checked="true" label="Refine matches model"
d50f079096ee Push to main toolshed
pieter.lukasse@wur.nl
parents:
diff changeset
111 help="This will let the algorithm search for a reduced set of secondary protein matches that still explains the variation in the peptide quantification patterns"/>
d50f079096ee Push to main toolshed
pieter.lukasse@wur.nl
parents:
diff changeset
112
d50f079096ee Push to main toolshed
pieter.lukasse@wur.nl
parents:
diff changeset
113
d50f079096ee Push to main toolshed
pieter.lukasse@wur.nl
parents:
diff changeset
114 <param name="summaryReport" type="boolean" checked="true" label="Generate summary report"/>
d50f079096ee Push to main toolshed
pieter.lukasse@wur.nl
parents:
diff changeset
115
d50f079096ee Push to main toolshed
pieter.lukasse@wur.nl
parents:
diff changeset
116 </inputs>
d50f079096ee Push to main toolshed
pieter.lukasse@wur.nl
parents:
diff changeset
117 <configfiles>
d50f079096ee Push to main toolshed
pieter.lukasse@wur.nl
parents:
diff changeset
118 <configfile name="annotatedQuantificationFilesList">## start comment
d50f079096ee Push to main toolshed
pieter.lukasse@wur.nl
parents:
diff changeset
119 ## iterate over the selected files and store their names in the config file
d50f079096ee Push to main toolshed
pieter.lukasse@wur.nl
parents:
diff changeset
120 #for $i, $s in enumerate( $annotatedQuantificationFiles )
d50f079096ee Push to main toolshed
pieter.lukasse@wur.nl
parents:
diff changeset
121 ${s.annotatedQuantificationFile}
d50f079096ee Push to main toolshed
pieter.lukasse@wur.nl
parents:
diff changeset
122 #end for
d50f079096ee Push to main toolshed
pieter.lukasse@wur.nl
parents:
diff changeset
123 ## end comment</configfile>
d50f079096ee Push to main toolshed
pieter.lukasse@wur.nl
parents:
diff changeset
124
d50f079096ee Push to main toolshed
pieter.lukasse@wur.nl
parents:
diff changeset
125 <configfile name="identificationFilesList">## start comment
d50f079096ee Push to main toolshed
pieter.lukasse@wur.nl
parents:
diff changeset
126 ## iterate over the selected files and store their names in the config file
d50f079096ee Push to main toolshed
pieter.lukasse@wur.nl
parents:
diff changeset
127 #for $i, $s in enumerate( $identificationFiles )
d50f079096ee Push to main toolshed
pieter.lukasse@wur.nl
parents:
diff changeset
128 ${s.identificationFile}
d50f079096ee Push to main toolshed
pieter.lukasse@wur.nl
parents:
diff changeset
129 ## also print out the datatype in the next line, based on previously configured datatype
d50f079096ee Push to main toolshed
pieter.lukasse@wur.nl
parents:
diff changeset
130 #if isinstance( $s.identificationFile.datatype, $__app__.datatypes_registry.get_datatype_by_extension('apml').__class__):
d50f079096ee Push to main toolshed
pieter.lukasse@wur.nl
parents:
diff changeset
131 apml
d50f079096ee Push to main toolshed
pieter.lukasse@wur.nl
parents:
diff changeset
132 #else:
25
5215b5cfdc53 workaround
pieter.lukasse@wur.nl
parents: 19
diff changeset
133 apml
0
d50f079096ee Push to main toolshed
pieter.lukasse@wur.nl
parents:
diff changeset
134 #end if
d50f079096ee Push to main toolshed
pieter.lukasse@wur.nl
parents:
diff changeset
135 #end for
d50f079096ee Push to main toolshed
pieter.lukasse@wur.nl
parents:
diff changeset
136 ## end comment</configfile>
d50f079096ee Push to main toolshed
pieter.lukasse@wur.nl
parents:
diff changeset
137 <configfile name="statisticalMeasuresConfigFile">## start comment
d50f079096ee Push to main toolshed
pieter.lukasse@wur.nl
parents:
diff changeset
138 ${statisticalMeasuresConfig}
d50f079096ee Push to main toolshed
pieter.lukasse@wur.nl
parents:
diff changeset
139 </configfile>
d50f079096ee Push to main toolshed
pieter.lukasse@wur.nl
parents:
diff changeset
140 </configfiles>
d50f079096ee Push to main toolshed
pieter.lukasse@wur.nl
parents:
diff changeset
141 <outputs>
d50f079096ee Push to main toolshed
pieter.lukasse@wur.nl
parents:
diff changeset
142 <data name="outputCSV" format="csv" label="${tool.name} on ${on_string}: Proteins list (CSV)" />
d50f079096ee Push to main toolshed
pieter.lukasse@wur.nl
parents:
diff changeset
143 <data name="outputInferenceLogCSV" format="csv" label="${tool.name} on ${on_string}: Inference log (CSV)"/>
d50f079096ee Push to main toolshed
pieter.lukasse@wur.nl
parents:
diff changeset
144 <data name="htmlReportFile" format="html" label="${tool.name} on ${on_string} - HTML report">
d50f079096ee Push to main toolshed
pieter.lukasse@wur.nl
parents:
diff changeset
145 <!-- If the expression is false, the file is not created -->
d50f079096ee Push to main toolshed
pieter.lukasse@wur.nl
parents:
diff changeset
146 <filter>( summaryReport == True )</filter>
d50f079096ee Push to main toolshed
pieter.lukasse@wur.nl
parents:
diff changeset
147 </data>
d50f079096ee Push to main toolshed
pieter.lukasse@wur.nl
parents:
diff changeset
148 <data name="outputSummaryAnnotationCSV" format="csv" label="${tool.name} on ${on_string} - Functional annotation summary (CSV)">
d50f079096ee Push to main toolshed
pieter.lukasse@wur.nl
parents:
diff changeset
149 <!-- If the expression is false, the file is not created -->
d50f079096ee Push to main toolshed
pieter.lukasse@wur.nl
parents:
diff changeset
150 <filter>( functionalAnnotationCSV != None )</filter>
d50f079096ee Push to main toolshed
pieter.lukasse@wur.nl
parents:
diff changeset
151 </data>
d50f079096ee Push to main toolshed
pieter.lukasse@wur.nl
parents:
diff changeset
152 </outputs>
d50f079096ee Push to main toolshed
pieter.lukasse@wur.nl
parents:
diff changeset
153 <tests>
d50f079096ee Push to main toolshed
pieter.lukasse@wur.nl
parents:
diff changeset
154 </tests>
d50f079096ee Push to main toolshed
pieter.lukasse@wur.nl
parents:
diff changeset
155 <help>
d50f079096ee Push to main toolshed
pieter.lukasse@wur.nl
parents:
diff changeset
156
d50f079096ee Push to main toolshed
pieter.lukasse@wur.nl
parents:
diff changeset
157 .. class:: infomark
d50f079096ee Push to main toolshed
pieter.lukasse@wur.nl
parents:
diff changeset
158
d50f079096ee Push to main toolshed
pieter.lukasse@wur.nl
parents:
diff changeset
159 This tool takes Peptide Quantification patterns and uses this to do Protein Inference of both Primary Protein
d50f079096ee Push to main toolshed
pieter.lukasse@wur.nl
parents:
diff changeset
160 identifications as well as Secondary Protein identifications. This last class of protein identifications
d50f079096ee Push to main toolshed
pieter.lukasse@wur.nl
parents:
diff changeset
161 can not be done by traditional protein inference methods that look only at peptide identifications and
d50f079096ee Push to main toolshed
pieter.lukasse@wur.nl
parents:
diff changeset
162 their quality parameters.
d50f079096ee Push to main toolshed
pieter.lukasse@wur.nl
parents:
diff changeset
163
d50f079096ee Push to main toolshed
pieter.lukasse@wur.nl
parents:
diff changeset
164
d50f079096ee Push to main toolshed
pieter.lukasse@wur.nl
parents:
diff changeset
165 -----
d50f079096ee Push to main toolshed
pieter.lukasse@wur.nl
parents:
diff changeset
166
d50f079096ee Push to main toolshed
pieter.lukasse@wur.nl
parents:
diff changeset
167 **List of definitions**
d50f079096ee Push to main toolshed
pieter.lukasse@wur.nl
parents:
diff changeset
168
d50f079096ee Push to main toolshed
pieter.lukasse@wur.nl
parents:
diff changeset
169 Primary Protein identification: protein identification belonging to the minimum set of proteins needed
d50f079096ee Push to main toolshed
pieter.lukasse@wur.nl
parents:
diff changeset
170 to account for the observed peptides.
d50f079096ee Push to main toolshed
pieter.lukasse@wur.nl
parents:
diff changeset
171
d50f079096ee Push to main toolshed
pieter.lukasse@wur.nl
parents:
diff changeset
172 Secondary Protein identification: extra protein identifications that do not below to the minimum set
d50f079096ee Push to main toolshed
pieter.lukasse@wur.nl
parents:
diff changeset
173 of proteins mentioned above.
d50f079096ee Push to main toolshed
pieter.lukasse@wur.nl
parents:
diff changeset
174
d50f079096ee Push to main toolshed
pieter.lukasse@wur.nl
parents:
diff changeset
175 raw intensities : is the intensity value resulting from the integration of the feature peak area
d50f079096ee Push to main toolshed
pieter.lukasse@wur.nl
parents:
diff changeset
176
d50f079096ee Push to main toolshed
pieter.lukasse@wur.nl
parents:
diff changeset
177 apex intensities: is the intensity value as on the highest point of the feature peak
d50f079096ee Push to main toolshed
pieter.lukasse@wur.nl
parents:
diff changeset
178
d50f079096ee Push to main toolshed
pieter.lukasse@wur.nl
parents:
diff changeset
179 normalized intensities : is the intensity normalized by some means
d50f079096ee Push to main toolshed
pieter.lukasse@wur.nl
parents:
diff changeset
180
d50f079096ee Push to main toolshed
pieter.lukasse@wur.nl
parents:
diff changeset
181 -----
d50f079096ee Push to main toolshed
pieter.lukasse@wur.nl
parents:
diff changeset
182
d50f079096ee Push to main toolshed
pieter.lukasse@wur.nl
parents:
diff changeset
183 **Minimum correlation in a cluster**
d50f079096ee Push to main toolshed
pieter.lukasse@wur.nl
parents:
diff changeset
184
d50f079096ee Push to main toolshed
pieter.lukasse@wur.nl
parents:
diff changeset
185 TODO - add doc.
d50f079096ee Push to main toolshed
pieter.lukasse@wur.nl
parents:
diff changeset
186
d50f079096ee Push to main toolshed
pieter.lukasse@wur.nl
parents:
diff changeset
187 -----
d50f079096ee Push to main toolshed
pieter.lukasse@wur.nl
parents:
diff changeset
188
d50f079096ee Push to main toolshed
pieter.lukasse@wur.nl
parents:
diff changeset
189 **Output details**
d50f079096ee Push to main toolshed
pieter.lukasse@wur.nl
parents:
diff changeset
190
d50f079096ee Push to main toolshed
pieter.lukasse@wur.nl
parents:
diff changeset
191 *Proteins list (CSV)*
d50f079096ee Push to main toolshed
pieter.lukasse@wur.nl
parents:
diff changeset
192
d50f079096ee Push to main toolshed
pieter.lukasse@wur.nl
parents:
diff changeset
193 This is the list of primary and secondary proteins and their calculated inference score. Proteins
d50f079096ee Push to main toolshed
pieter.lukasse@wur.nl
parents:
diff changeset
194 with exactly the same peptide hits are also grouped together and labeled as primary_group and secondary_group
d50f079096ee Push to main toolshed
pieter.lukasse@wur.nl
parents:
diff changeset
195 instead of simply primary and secondary.
d50f079096ee Push to main toolshed
pieter.lukasse@wur.nl
parents:
diff changeset
196
d50f079096ee Push to main toolshed
pieter.lukasse@wur.nl
parents:
diff changeset
197
d50f079096ee Push to main toolshed
pieter.lukasse@wur.nl
parents:
diff changeset
198 *Inference log (CSV)*
d50f079096ee Push to main toolshed
pieter.lukasse@wur.nl
parents:
diff changeset
199
d50f079096ee Push to main toolshed
pieter.lukasse@wur.nl
parents:
diff changeset
200 This CSV table shows all data, both inferred and ruled out proteins. This can be used by the user to
d50f079096ee Push to main toolshed
pieter.lukasse@wur.nl
parents:
diff changeset
201 troubleshoot the inference process and understand why certain proteins might have been ruled out.
d50f079096ee Push to main toolshed
pieter.lukasse@wur.nl
parents:
diff changeset
202 The CSV is provided in such a format that the data can easily be explored in a Cytoscape network.
d50f079096ee Push to main toolshed
pieter.lukasse@wur.nl
parents:
diff changeset
203
d50f079096ee Push to main toolshed
pieter.lukasse@wur.nl
parents:
diff changeset
204 The figure below shows an example of the data being explored in Cytoscape using also the
d50f079096ee Push to main toolshed
pieter.lukasse@wur.nl
parents:
diff changeset
205 `Cytoscape chartplugin`_ to visualize the quantification data when selecting the peptide nodes.
d50f079096ee Push to main toolshed
pieter.lukasse@wur.nl
parents:
diff changeset
206
d50f079096ee Push to main toolshed
pieter.lukasse@wur.nl
parents:
diff changeset
207 .. image:: $PATH_TO_IMAGES/quantifere_cyto_out.png
d50f079096ee Push to main toolshed
pieter.lukasse@wur.nl
parents:
diff changeset
208
4
73c7c6589202 small fixes
pieter.lukasse@wur.nl
parents: 0
diff changeset
209 .
0
d50f079096ee Push to main toolshed
pieter.lukasse@wur.nl
parents:
diff changeset
210
d50f079096ee Push to main toolshed
pieter.lukasse@wur.nl
parents:
diff changeset
211 .. _Cytoscape chartplugin: http://apps.cytoscape.org/apps/chartplugin
d50f079096ee Push to main toolshed
pieter.lukasse@wur.nl
parents:
diff changeset
212
d50f079096ee Push to main toolshed
pieter.lukasse@wur.nl
parents:
diff changeset
213
19
d31c6978d9d0 fixes for NapQ
pieter.lukasse@wur.nl
parents: 17
diff changeset
214 **References**
d31c6978d9d0 fixes for NapQ
pieter.lukasse@wur.nl
parents: 17
diff changeset
215
d31c6978d9d0 fixes for NapQ
pieter.lukasse@wur.nl
parents: 17
diff changeset
216 If you use this Galaxy tool in work leading to a scientific publication please
d31c6978d9d0 fixes for NapQ
pieter.lukasse@wur.nl
parents: 17
diff changeset
217 cite the following papers:
d31c6978d9d0 fixes for NapQ
pieter.lukasse@wur.nl
parents: 17
diff changeset
218
d31c6978d9d0 fixes for NapQ
pieter.lukasse@wur.nl
parents: 17
diff changeset
219 Pieter N. J. Lukasse and Antoine H. P. America (2014).
d31c6978d9d0 fixes for NapQ
pieter.lukasse@wur.nl
parents: 17
diff changeset
220 Protein Inference Using Peptide Quantification Patterns.
d31c6978d9d0 fixes for NapQ
pieter.lukasse@wur.nl
parents: 17
diff changeset
221 http://dx.doi.org/10.1021/pr401072g
d31c6978d9d0 fixes for NapQ
pieter.lukasse@wur.nl
parents: 17
diff changeset
222
0
d50f079096ee Push to main toolshed
pieter.lukasse@wur.nl
parents:
diff changeset
223
d50f079096ee Push to main toolshed
pieter.lukasse@wur.nl
parents:
diff changeset
224 </help>
19
d31c6978d9d0 fixes for NapQ
pieter.lukasse@wur.nl
parents: 17
diff changeset
225 <citations>
d31c6978d9d0 fixes for NapQ
pieter.lukasse@wur.nl
parents: 17
diff changeset
226 <citation type="doi">10.1021/pr401072g</citation> <!-- example
d31c6978d9d0 fixes for NapQ
pieter.lukasse@wur.nl
parents: 17
diff changeset
227 see also https://wiki.galaxyproject.org/Admin/Tools/ToolConfigSyntax#A.3Ccitations.3E_tag_set
d31c6978d9d0 fixes for NapQ
pieter.lukasse@wur.nl
parents: 17
diff changeset
228 -->
d31c6978d9d0 fixes for NapQ
pieter.lukasse@wur.nl
parents: 17
diff changeset
229 </citations>
0
d50f079096ee Push to main toolshed
pieter.lukasse@wur.nl
parents:
diff changeset
230 </tool>