annotate hammock.xml @ 1:d90f4809ccc6 draft

Uploaded
author hammock
date Fri, 28 Aug 2015 07:38:12 -0400
parents b1ac138f0287
children 4db310b7e37c
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
1
d90f4809ccc6 Uploaded
hammock
parents: 0
diff changeset
1 <tool id="hammock_1.0" name="Hammock - cluster peptides" version="1.0.2" hidden="false">
0
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
2
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
3 <description>Clusters short peptide sequences</description>
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
4
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
5 <command interpreter="bash">
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
6 wrapper.sh \$HAMMOCK_JAR full --galaxy -t \${GALAXY_SLOTS:-4} -i $input --goc $output_clusters --gos $output_sequences
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
7 ## Build the comma-separated label list for -l. The accumulator must exist before the loop appends to it.
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
8 #if $label_params.set_labels == "set":
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
9 #set $l_field = ""
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
10 #for $s in $label_params.round_labels:
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
11 #set $l_field = $l_field + str($s.label) + ","
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
12 #end for
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
13 -l $l_field
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
14 #end if
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
15 #if $advanced_greedy_params.set_greedy_params == "set":
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
16 -x $advanced_greedy_params.max_shift
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
17 -p $advanced_greedy_params.shift_penalty
1
d90f4809ccc6 Uploaded
hammock
parents: 0
diff changeset
18 -R $advanced_greedy_params.set_order.order
d90f4809ccc6 Uploaded
hammock
parents: 0
diff changeset
19
d90f4809ccc6 Uploaded
hammock
parents: 0
diff changeset
20 #if $advanced_greedy_params.set_order.order == "random":
d90f4809ccc6 Uploaded
hammock
parents: 0
diff changeset
21 -S $advanced_greedy_params.set_order.seed
d90f4809ccc6 Uploaded
hammock
parents: 0
diff changeset
22 #end if
d90f4809ccc6 Uploaded
hammock
parents: 0
diff changeset
23
0
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
24 -m \${MATRIX_PATH}${advanced_greedy_params.scoring_matrix}.txt
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
25 #if $advanced_greedy_params.greedy_params.set_greedy == "set":
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
26 -g $advanced_greedy_params.greedy_params.greedy_threshold
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
27 #end if
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
28 #end if
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
29
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
30 #if $advanced_hmm_params.set_hmm_params == "set":
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
31 #if $advanced_hmm_params.threshold_params.clustering_threshold == "part":
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
32 -a $advanced_hmm_params.threshold_params.part_threshold
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
33 #end if
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
34
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
35 #if $advanced_hmm_params.threshold_params.clustering_threshold == "size":
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
36 -s $advanced_hmm_params.threshold_params.size_threshold
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
37 #end if
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
38
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
39 #if $advanced_hmm_params.threshold_params.clustering_threshold == "count":
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
40 -c $advanced_hmm_params.threshold_params.count_threshold
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
41 #end if
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
42
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
43 #set $n_field=""
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
44 #set $v_field=""
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
45 #set $r_field=""
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
46
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
47 #if $advanced_hmm_params.score_params.set_scores == "set":
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
48 #if $advanced_hmm_params.score_params.relative_scores == "relative":
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
49 -e
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
50 #end if
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
51 #if $advanced_hmm_params.score_params.relative_scores == "absolute":
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
52 -b
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
53 #end if
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
54
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
55 #for $s in $advanced_hmm_params.score_params.round:
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
56 #set $n_field = $n_field + str($s.assign_score) + ","
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
57 #set $v_field = $v_field + str($s.overlap_score) + ","
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
58 #set $r_field = $r_field + str($s.merge_score) + ","
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
59 #end for
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
60
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
61 -n $n_field
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
62 -v $v_field
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
63 -r $r_field
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
64 #end if
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
65 #set $l_field=""
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
66
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
67 #if $advanced_hmm_params.match_state_params.set_max_aln_length == "set":
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
68 -j $advanced_hmm_params.match_state_params.max_aln_length
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
69 #end if
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
70 ## extension_increase_length is a conditional; its select is named set_max_aln_length and holds "true" or "false".
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
71 #if $advanced_hmm_params.extension_increase_length.set_max_aln_length == "true":
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
72 -q
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
73 #end if
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
74
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
75 -k $advanced_hmm_params.min_ic
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
76 -y $advanced_hmm_params.max_gap_proportion
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
77 -u $advanced_hmm_params.max_inner_gaps
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
78 -h $advanced_hmm_params.min_match_states
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
79 #end if
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
80
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
81 </command>
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
82
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
83 <inputs>
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
84 <param format="fasta" name="input" type="data" label="Source sequence file" help="File with sequences to cluster in fasta format. See -i, --input in manual for details." />
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
85
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
86 <conditional name="label_params">
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
87 <param name="set_labels" type="select" label="Specify a subset of labels to be used" help="Set Automatic to use all labels present in the data or choose a subset of labels to be used. See -l, --labels in manual for details.">
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
88 <option value="auto">Automatic - all labels</option>
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
89 <option value="set">Set list of labels manually</option>
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
90 </param>
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
91 <when value="auto" />
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
92 <when value="set">
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
93 <repeat name="round_labels" title="Label">
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
94 <param name="label" type="text" value="" label="Sequence label"/>
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
95 </repeat>
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
96 </when>
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
97 </conditional>
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
98
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
99
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
100 <conditional name="advanced_greedy_params">
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
101 <param name="set_greedy_params" type="select" label="Greedy clustering options">
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
102 <option value="auto">Default - automatic settings</option>
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
103 <option value="set">Set manually</option>
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
104 </param>
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
105 <when value="auto" />
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
106 <when value="set">
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
107
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
108 <param name="max_shift" type="integer" value="3" min="0" label="Maximal sequence shift" help="Maximal number of positions sequences are allowed to shift for during greedy clustering. See -x, --max shift in manual for details." />
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
109
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
110 <param name="shift_penalty" type="integer" value="0" label="Sequence shift penalty" help="Score penalty added to each alignment score during greedy clustering. This penalty is added for every amino acid aligned towards a (trailing) gap. This value should typically be non-positive (With a positive value, sequences benefit from containing more gaps). See -p, --gap penalty in manual for details."/>
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
111
1
d90f4809ccc6 Uploaded
hammock
parents: 0
diff changeset
112 <conditional name="set_order">
d90f4809ccc6 Uploaded
hammock
parents: 0
diff changeset
113
d90f4809ccc6 Uploaded
hammock
parents: 0
diff changeset
114 <param name="order" type="select" label="Greedy clustering order" help="Select the order of sequences during the greedy clustering. See -R, --order in manual for details.">
d90f4809ccc6 Uploaded
hammock
parents: 0
diff changeset
115 <option value="size">Size</option>
d90f4809ccc6 Uploaded
hammock
parents: 0
diff changeset
116 <option value="alphabetic">Alphabetic</option>
d90f4809ccc6 Uploaded
hammock
parents: 0
diff changeset
117 <option value="random">Random</option>
d90f4809ccc6 Uploaded
hammock
parents: 0
diff changeset
118 </param>
d90f4809ccc6 Uploaded
hammock
parents: 0
diff changeset
119
d90f4809ccc6 Uploaded
hammock
parents: 0
diff changeset
120 <when value="size" />
d90f4809ccc6 Uploaded
hammock
parents: 0
diff changeset
121 <when value="alphabetic" />
d90f4809ccc6 Uploaded
hammock
parents: 0
diff changeset
122 <when value="random">
d90f4809ccc6 Uploaded
hammock
parents: 0
diff changeset
123 <param name="seed" type="integer" value="42" label="Seed for random number generation" help="Set a seed value for the pseudorandom sequence order. See -S, --seed in manual for details."/>
d90f4809ccc6 Uploaded
hammock
parents: 0
diff changeset
124 </when>
d90f4809ccc6 Uploaded
hammock
parents: 0
diff changeset
125
d90f4809ccc6 Uploaded
hammock
parents: 0
diff changeset
126 </conditional>
d90f4809ccc6 Uploaded
hammock
parents: 0
diff changeset
127
d90f4809ccc6 Uploaded
hammock
parents: 0
diff changeset
128
d90f4809ccc6 Uploaded
hammock
parents: 0
diff changeset
129
0
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
130 <param name="scoring_matrix" type="select" label="Substitution matrix schema." help="Select a substitution matrix to be used to score alignments during greedy clustering. See -m, --matrix in manual for details.">
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
131 <option value="blosum62">Blosum 62</option>
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
132 <option value="blosum30">Blosum 30</option>
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
133 <option value="blosum35">Blosum 35</option>
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
134 <option value="blosum40">Blosum 40</option>
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
135 <option value="blosum45">Blosum 45</option>
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
136 <option value="blosum50">Blosum 50</option>
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
137 <option value="blosum55">Blosum 55</option>
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
138 <option value="blosum60">Blosum 60</option>
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
139 <option value="blosum65">Blosum 65</option>
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
140 <option value="blosum70">Blosum 70</option>
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
141 <option value="blosum75">Blosum 75</option>
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
142 <option value="blosum80">Blosum 80</option>
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
143 <option value="blosum85">Blosum 85</option>
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
144 <option value="blosum90">Blosum 90</option>
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
145 <option value="blosum100">Blosum 100</option>
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
146 <option value="gonnet250">Gonnet 250</option>
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
147 <option value="pam250">Pam 250</option>
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
148 </param>
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
149
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
150 <conditional name="greedy_params">
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
151 <param name="set_greedy" type="select" label="Set greedy clustering threshold" help="Minimal alignment score needed for a sequence to join a cluster during greedy clustering. Can be either user defined or set automatically based on mean sequence length. See -g, --greedy threshold in manual for details.">
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
152 <option value="auto">Auto detection</option>
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
153 <option value="set">Set manually</option>
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
154 </param>
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
155 <when value="auto" />
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
156 <when value="set">
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
157 <param name="greedy_threshold" type="integer" value="24" min="0" label="Greedy clustering threshold" help="Minimal alignment score needed for a sequence to join a cluster during greedy clustering." />
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
158 </when>
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
159 </conditional>
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
160
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
161 </when>
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
162 </conditional>
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
163
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
164 <conditional name="advanced_hmm_params">
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
165 <param name="set_hmm_params" type="select" label="HMM-clustering options">
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
166 <option value="auto">Default - automatic settings</option>
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
167 <option value="set">Set manually</option>
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
168 </param>
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
169 <when value="auto" />
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
170 <when value="set">
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
171
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
172
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
173 <conditional name="threshold_params">
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
174 <param name="clustering_threshold" type="select" label="How many initial clusters to use as cluster cores" help="After greedy clustering, some of the largest clusters are selected as cluster cores for subsequent clustering procedure. The number of cluster cores can be determined either automatically or manually as top x percent of largest clusters, all clusters satisfying size threshold or exact number of clusters. See -a, --part threshold, -s, --size threshold and -c, --count threshold in manual for details.">
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
175 <option value="auto">Automatic setting</option>
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
176 <option value="part">Set percentual proportion</option>
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
177 <option value="size">Set size threshold</option>
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
178 <option value="count">Set explicit count</option>
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
179 </param>
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
180 <when value="auto" />
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
181 <when value="part">
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
182 <param name="part_threshold" type="float" value="0.025" min="0.00001" max="1.0" label="The proportion of the largest greedy clusters to be used as cluster cores in subsequent clustering procedure." help="See -a, --part threshold in manual for details." />
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
183 </when>
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
184 <when value="size">
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
185 <param name="size_threshold" type="integer" value="10" min="1" label="Minimum size of a greedy cluster needed for it to be used as cluster core in subsequent clustering procedure." help="See -s, --size threshold in manual for details."/>
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
186 </when>
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
187 <when value="count">
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
188 <param name="count_threshold" type="integer" value="25" min="1" label="The number of greedy clusters to be used as cluster cores in subsequent clustering procedure." help="See -c, --count threshold in manual for details"/>
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
189 </when>
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
190 </conditional>
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
191
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
192 <conditional name="score_params">
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
193 <param name="set_scores" type="select" label="Clustering rounds" help="Set the number of clustering rounds and score thresholds used. Automatic mode means 3 rounds and score thresholds defined based on mean sequence length.">
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
194 <option value="auto">Automatic settings</option>
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
195 <option value="set">Set manually</option>
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
196 </param>
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
197 <when value="auto" />
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
198 <when value="set">
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
199 <param name="relative_scores" type="select" label="Relative/absolute scores" help="All score thresholds in all clustering rounds can be interpreted either as relative values (per HMM match-state) or absolute values. See -e, --relative thresholds in manual for details.">
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
200 <option value="absolute">Scores are absolute values</option>
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
201 <option value="relative">Scores are relative, i.e. per match state</option>
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
202 </param>
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
203 <repeat name="round" title="Round">
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
204 <param name="assign_score" type="float" value="10.0" min="0.0" label="Assign threshold" help="Minimal score needed for a sequence to be assigned to a cluster. See -n, --assign thresholds in manual for details." />
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
205 <param name="overlap_score" type="float" value="8.0" min="0.0" label="Overlap threshold" help="Minimal score needed for two clusters to be considered overlapping. This affects cluster merging step heuristic speedup. If this is set to 0.0, full cluster merging routine will be performed, which is the most precise but the slowest. It is suggested to perform full cluster merging routine at least in the last round. See -v, --overlap thresholds in manual for details."/>
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
206 <param name="merge_score" type="float" value="10.0" min="0.0" label="Merge threshold" help="Minimal score needed for two clusters to be merged. See -r, --merge thresholds in manual for details"/>
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
207 </repeat>
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
208 </when>
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
209 </conditional>
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
210
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
211 <param name="min_match_states" type="integer" value="4" min="0" label="Minimal number of HMM match states." help=" Minimal number of match states maintained for each cluster's HMM throughout the computation. This parameter can be also viewed as minimal motif length. See -h, --min match states in manual for details."/>
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
212
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
213 <param name="max_gap_proportion" type="float" value="0.05" min="0.0" max="1.0" label="Maximal proportion of gaps allowed in a match state" help="Maximal proportion of gaps in HMM match states. Any multiple sequence alignment column containing more gaps will not be considered a match state. See -y, --max gap proportion in manual for details."/>
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
214
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
215 <param name="min_ic" type="float" value="1.2" min="0.0" max="4.3219280" label="Minimal information content allowed in a match state" help="Minimal information content (In terms of Shannon information theory) of HMM match states. Any multiple sequence alignment column having lower information content will not be considered a match state. Minimum: 0.0 (any MSA column composition), maximum: 4.32 (MSA column containing the same amino acid on each line). See -k, --min ic in manual for details."/>
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
216
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
217
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
218 <conditional name="match_state_params">
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
219 <param name="set_max_aln_length" type="select" label="Maximal alignment length" help="Maximal multiple sequence alignment length for every cluster. Can be either user defined or specified automatically based on mean sequence length. See -j, --max aln length in manual for details.">
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
220 <option value="auto">Auto detection</option>
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
221 <option value="set">Set manually</option>
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
222 </param>
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
223 <when value="auto" />
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
224 <when value="set">
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
225 <param name="max_aln_length" type="integer" value="24" min="0" label="Maximal alignment length" help="Maximal multiple sequence alignment length for every cluster." />
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
226 </when>
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
227 </conditional>
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
228
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
229 <param name="max_inner_gaps" type="integer" value="0" min="0" label="Maximum number of inner gaps" help="Maximum number of inner gaps in any line of any cluster's multiple sequence alignment. See -u, --max inner gaps in manual for details."/>
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
230
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
231 <conditional name="extension_increase_length">
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
232 <param name="set_max_aln_length" type="select" label="Can MSA length be increased during extension step?" help="By default, only cluster merging can increase cluster's multiple sequence alignment length. Setting this option to 'Yes' will also allow sequence insertions to increase the MSA length. See -q, --extension increase length in manual for details.">
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
233 <option value="false">No</option>
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
234 <option value="true">Yes</option>
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
235 </param>
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
236 <when value="true" />
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
237 <when value="false" />
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
238 </conditional>
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
239 </when>
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
240 </conditional>
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
241
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
242 </inputs>
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
243
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
244 <outputs>
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
245 <data format="csv" name="output_clusters" />
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
246 <data format="csv" name="output_sequences" />
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
247 </outputs>
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
248
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
249 <requirements>
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
250 <requirement type="set_environment">HHLIB</requirement>
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
251 <requirement type="set_environment">HAMMOCK_JAR</requirement>
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
252 <requirement type="set_environment">MATRIX_PATH</requirement>
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
253 <requirement type="package" version="1.6.0">java</requirement>
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
254 <requirement type="package" version="1.2.0">clustalomega</requirement>
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
255 <requirement type="package" version="3.1b1">hmmer</requirement>
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
256 <requirement type="package" version="2.0.16">hhsuite</requirement>
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
257 </requirements>
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
258
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
259
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
260 <tests>
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
261 <test>
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
262 <param name="input" value="input.fa" />
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
263 <param name="advanced_greedy_params.max_shift" value="3" />
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
264 <param name="advanced_greedy_params.shift_penalty" value="0" />
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
265 <param name="advanced_greedy_params.scoring_matrix" value="blosum62" />
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
266 <param name="advanced_hmm_params.min_match_states" value="4" />
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
267 <param name="advanced_hmm_params.min_ic" value="1.2" />
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
268 <param name="advanced_hmm_params.max_gap_proportion" value="0.05" />
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
269 <param name="advanced_hmm_params.max_inner_gaps" value="0" />
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
270
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
271 <output name="output_clusters" file="output_clusters.csv" />
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
272 <output name="output_sequences" file="output_sequences.csv" />
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
273 </test>
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
274 </tests>
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
275
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
276
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
277
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
278 <help>
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
279
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
280
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
281 **Hammock overview**
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
282
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
283 Hammock performs peptide sequence clustering. It is able to identify clusters of sequences sharing a sequence motif within big datasets. For news, documentation and other available versions, see http://www.recamo.cz/en/software/hammock-cluster-peptides/
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
284
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
285 ------
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
286
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
287 .. class:: infomark
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
288
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
289 **Citation**
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
290 Please cite:
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
291
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
292 Krejci A, et al. *in preparation*
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
293
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
294 ------
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
295
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
296 **Input format**
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
297
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
298 Hammock accepts fasta files. For basic work, fasta description lines (those starting with ">") may contain virtually anything. For work with the concept of sequence labels, description line should be in this form:
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
299
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
300 | >id|count|label
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
301
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
302 An example of two records in this format:
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
303
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
304 | >1|42|label1
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
305 | RSPIVRQLPSLP
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
306 | >2|58|label2
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
307 | GSWVVDISNVED
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
308
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
309 For more detailed description of the label concept and input format, see the documentation_.
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
310
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
311 ------
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
312
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
313 **Outputs**
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
314
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
315 Hammock returns two files; both are semicolon-separated tables.
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
316
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
317 The first is the cluster overview file. It contains one line for each resulting cluster plus header. Columns are:
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
318
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
319 cluster_id main_sequence sum label1 label2 label3 ...
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
320
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
321 | cluster_id: Cluster's unique numeric identifier.
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
322 | main_sequence: The most popular (appearing in the highest number of copies) sequence of this cluster
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
323 | sum: Total count of all sequences in this cluster (sum over all labels)
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
324 | label1, label2 etc.: Counts of sequences with particular labels
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
325
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
326
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
327 The second file provides more detailed information. It contains one line for each clustered sequence plus header. Columns are:
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
328
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
329 cluster_id sequence alignment sum label1 label2 label3 ...
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
330
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
331 | cluster_id: Id of the cluster this sequence belongs to
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
332 | sequence: Amino acid sequence of this peptide
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
333 | alignment: Aligned amino acid sequence of this peptide (part of cluster's multiple sequence alignment)
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
334 | sum: Total count of copies of this sequence (sum over all labels)
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
335 | label1, label2 etc.: Counts of copies with particular labels
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
336
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
337 ------
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
338
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
339 **Parameters**
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
340 Default and auto-detected parameters have been carefully tuned and tested to work well with several datasets; they are especially suited for short peptides from phage display experiments. Nevertheless, there is no such thing as universal rules suitable for every dataset - parameter understanding and tuning may be needed. For a more detailed description of the parameters, see the documentation_.
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
341
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
342 .. _documentation: http://www.recamo.cz/userfiles/file/Software/Hammock/Hammock-manual.pdf
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
343
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
344
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
345 </help>
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
346
b1ac138f0287 Uploaded
hammock
parents:
diff changeset
347 </tool>