comparison freebayes.xml @ 23:52aed7d9ed2b draft

planemo upload for repository https://github.com/galaxyproject/tools-devteam/tree/master/tools/freebayes commit cf4a70e780f104bc724323912b3b87fb37f887dd
author devteam
date Sun, 25 Sep 2016 09:48:24 -0400
parents 99684adf84de
children da6e10dee68b
comparison
equal deleted inserted replaced
22:99684adf84de 23:52aed7d9ed2b
1 <?xml version="1.0"?> 1 <tool id="freebayes" name="FreeBayes" version="1.0.2.29--1">
2 <tool id="freebayes" name="FreeBayes" version="0.4.1"> 2 <description> - bayesian genetic variant detector</description>
3 <requirements> 3 <requirements>
4 <requirement type="package" version="0_9_20_b040236">freebayes</requirement> 4 <requirement type="package" version="1.0.2.29">freebayes</requirement>
5 <requirement type="package" version="0.1.18">samtools</requirement> 5 <requirement type="package" version="0.1.19">samtools</requirement>
6 </requirements> 6 <requirement type="package" version="4.1.3">gawk</requirement>
7 <description> - bayesian genetic variant detector</description> 7 <requirement type="package" version="20160622">parallel</requirement>
8 <command> 8 </requirements>
9 <stdio>
10 <exit_code range="1:" />
11 </stdio>
12 <command>
13 <![CDATA[
9 ##set up input files 14 ##set up input files
10 15
11 #set $reference_fasta_filename = "localref.fa" 16 #set $reference_fasta_filename = "localref.fa"
12 17
13 #if str( $reference_source.reference_source_selector ) == "history": 18 #if str( $reference_source.reference_source_selector ) == "history":
14 ln -s "${reference_source.ref_file}" "${reference_fasta_filename}" &amp;&amp; 19 ln -s "${reference_source.ref_file}" "${reference_fasta_filename}" &&
15 samtools faidx "${reference_fasta_filename}" 2&gt;&amp;1 || echo "Error running samtools faidx for FreeBayes" &gt;&amp;2 &amp;&amp; 20 samtools faidx "${reference_fasta_filename}" 2>&1 || echo "Error running samtools faidx for FreeBayes" >&2 &&
16 #else: 21 #else:
17 #set $reference_fasta_filename = str( $reference_source.ref_file.fields.path ) 22 #set $reference_fasta_filename = str( $reference_source.ref_file.fields.path )
18 #end if 23 #end if
19 24
20 #for $bam_count, $input_bam in enumerate( $reference_source.input_bams ): 25 #for $bam_count, $input_bam in enumerate( $reference_source.input_bams ):
21 ln -s "${input_bam.input_bam}" "localbam_${bam_count}.bam" &amp;&amp; 26 ln -s "${input_bam}" "b_${bam_count}.bam" &&
22 ln -s "${input_bam.input_bam.metadata.bam_index}" "localbam_${bam_count}.bam.bai" &amp;&amp; 27 ln -s "${input_bam.metadata.bam_index}" "b_${bam_count}.bam.bai" &&
23 #end for 28 #end for
24 29
25 ## Tabixize optional input_varinat_vcf file (for --variant-input option) 30 ## Tabixize optional input_varinat_vcf file (for --variant-input option)
26 31 #if ( str( $options_type.options_type_selector ) == 'cline' or str( $options_type.options_type_selector ) == 'full' ) and str( $options_type.optional_inputs.optional_inputs_selector ) == 'set' and str( $options_type.optional_inputs.input_variant_type.input_variant_type_selector ) == "provide_vcf":
27 #if ( str( $options_type.options_type_selector ) == 'cline' or str( $options_type.options_type_selector ) == 'full' ) and $options_type.optional_inputs.optional_inputs_selector and str( $options_type.optional_inputs.input_variant_type.input_variant_type_selector ) == "provide_vcf": 32 ln -s "${options_type.optional_inputs.input_variant_type.input_variant_vcf}" "input_variant_vcf.vcf.gz" &&
28 ln -s "${options_type.optional_inputs.input_variant_type.input_variant_vcf}" "input_variant_vcf.vcf.gz" &amp;&amp; 33 ln -s "${Tabixized_input}" "input_variant_vcf.vcf.gz.tbi" &&
29 ln -s "${Tabixized_input}" "input_variant_vcf.vcf.gz.tbi" &amp;&amp;
30 #end if 34 #end if
31 35
32 ##finished setting up inputs 36 #for $bam_count, $input_bam in enumerate( $reference_source.input_bams ):
33 37 samtools view -H b_${bam_count}.bam | grep "^@SQ" | cut -f 2- | awk '{ gsub("^SN:","",$1); gsub("^LN:","",$2); print $1"\t0\t"$2; }' >> regions_all.bed &&
34 ##COMMAND LINE STARTS HERE 38 #end for
35 39
40 sort -u regions_all.bed > regions_uniq.bed &&
41 ## split into even small chunks, this has some disatvantages and will not be used for the moment
42 ## bedtools makewindows -b regions_uniq.bed -w 10000000 -s 9990000 > regions.bed &&
43
44 mkdir vcf_output &&
45 mkdir failed_alleles &&
46 mkdir trace &&
47
48 ## Finished setting up inputs
49
50 for i in `cat regions_uniq.bed | awk '{print $1":"$2".."$3}'`;
51 do
52
53 echo "
54
55 ## COMMAND LINE STARTS HERE
56
36 freebayes 57 freebayes
58
59 --region '\$i'
60
37 #for $bam_count, $input_bam in enumerate( $reference_source.input_bams ): 61 #for $bam_count, $input_bam in enumerate( $reference_source.input_bams ):
38 --bam "localbam_${bam_count}.bam" 62 --bam 'b_${bam_count}.bam'
39 #end for 63 #end for
40 --fasta-reference "${reference_fasta_filename}" 64 --fasta-reference '${reference_fasta_filename}'
41 65
42 ##outputs 66 ## Outputs
43 --vcf "${output_vcf}" 67 --vcf './vcf_output/part_\$i.vcf'
44 68
45 #if str( $target_limit_type.target_limit_type_selector ) == "limit_by_target_file": 69 #if str( $target_limit_type.target_limit_type_selector ) == "limit_by_target_file":
46 --targets "${target_limit_type.input_target_bed}" 70 --targets '${target_limit_type.input_target_bed}'
47 #elif str( $target_limit_type.target_limit_type_selector ) == "limit_by_region": 71 #elif str( $target_limit_type.target_limit_type_selector ) == "limit_by_region":
48 --region "${target_limit_type.region_chromosome}:${target_limit_type.region_start}..${target_limit_type.region_end}" 72 --region '${target_limit_type.region_chromosome}:${target_limit_type.region_start}..${target_limit_type.region_end}'
49 #end if 73 #end if
50 74
51 ##advanced options 75 ##advanced options
52 #if str( $options_type.options_type_selector ) == "simple": 76 #if str( $options_type.options_type_selector ) == "simple":
53 ##do nothing as command like build up to this point is sufficinet for simple diploid calling 77 ##do nothing as command like build up to this point is sufficinet for simple diploid calling
54 78
55 #elif str( $options_type.options_type_selector ) == "simple_w_filters": 79 #elif str( $options_type.options_type_selector ) == "simple_w_filters":
56 80 --standard-filters
57 --standard-filters 81 --min-coverage '${options_type.min_coverage}'
58 --min-coverage "${options_type.min_coverage}"
59
60 #elif str( $options_type.options_type_selector ) == "naive": 82 #elif str( $options_type.options_type_selector ) == "naive":
61 83 --haplotype-length 0
62 --haplotype-length 0 84 --min-alternate-count 1
63 --min-alternate-count 1 85 --min-alternate-fraction 0
64 --min-alternate-fraction 0 86 --pooled-continuous
65 --pooled-continuous 87 --report-monomorphic
66 --report-monomorphic
67
68 #elif str( $options_type.options_type_selector ) == "naive_w_filters": 88 #elif str( $options_type.options_type_selector ) == "naive_w_filters":
69 89 --haplotype-length 0
70 --haplotype-length 0 90 --min-alternate-count 1
71 --min-alternate-count 1 91 --min-alternate-fraction 0
72 --min-alternate-fraction 0 92 --pooled-continuous
73 --pooled-continuous 93 --report-monomorphic
74 --report-monomorphic 94 --standard-filters
75 --standard-filters 95 --min-coverage '${options_type.min_coverage}'
76 --min-coverage "${options_type.min_coverage}" 96
77 97 ## Command line direct text entry is not allowed at this time for security reasons
78 ## Command line direct text entry is not allowed at this time for security reasons
79
80 #elif str( $options_type.options_type_selector ) == "full": 98 #elif str( $options_type.options_type_selector ) == "full":
81 99 #if str( $options_type.optional_inputs.optional_inputs_selector ) == 'set':
82 #if $options_type.optional_inputs.optional_inputs_selector: 100 ${options_type.optional_inputs.report_monomorphic}
83 101
84 ${options_type.optional_inputs.report_monomorphic} 102 #if $options_type.optional_inputs.output_trace_option:
85 103 --trace ./trace/part_'\$i'.txt
86 #if $options_type.optional_inputs.output_trace_option: 104 #end if
87 --trace "${output_trace}" 105 #if $options_type.optional_inputs.output_failed_alleles_option:
88 #end if 106 --failed-alleles ./failed_alleles/part_'\$i'.bed
89 107 #end if
90 #if $options_type.optional_inputs.output_failed_alleles_option: 108 #if $options_type.optional_inputs.samples:
91 --failed-alleles "${output_failed_alleles_bed}" 109 --samples '${options_type.optional_inputs.samples}'
92 #end if 110 #end if
93 111 #if $options_type.optional_inputs.populations:
94 #if $options_type.optional_inputs.samples: 112 --populations '${options_type.optional_inputs.populations}'
95 --samples "${options_type.optional_inputs.samples}" 113 #end if
96 #end if 114 #if $options_type.optional_inputs.A:
97 115 --cnv-map '${options_type.optional_inputs.A}'
98 #if $options_type.optional_inputs.populations: 116 #end if
99 --populations "${options_type.optional_inputs.populations}" 117 #if str( $options_type.optional_inputs.input_variant_type.input_variant_type_selector ) == "provide_vcf":
100 #end if 118 --variant-input 'input_variant_vcf.vcf.gz' ## input_variant_vcf.vcf.gz is symlinked to a galaxy-generated dataset in "Tabixize optional input_varinat_vcf file" section of the command line above
101 119 ${options_type.optional_inputs.input_variant_type.only_use_input_alleles}
102 #if $options_type.optional_inputs.A: 120 #end if
103 --cnv-map "${options_type.optional_inputs.A}" 121 #if $options_type.optional_inputs.haplotype_basis_alleles:
104 #end if 122 --haplotype-basis-alleles '${options_type.optional_inputs.haplotype_basis_alleles}'
105 123 #end if
106 #if str( $options_type.optional_inputs.input_variant_type.input_variant_type_selector ) == "provide_vcf": 124 #if $options_type.optional_inputs.observation_bias:
107 --variant-input "input_variant_vcf.vcf.gz" ## input_variant_vcf.vcf.gz is symlinked to a galaxy-generated dataset in "Tabixize optional input_varinat_vcf file" section of the command line above 125 --observation-bias '${options_type.optional_inputs.observation_bias}'
108 ${options_type.optional_inputs.input_variant_type.only_use_input_alleles} 126 #end if
109 #end if 127 #if $options_type.optional_inputs.contamination_estimates:
110 128 --contamination-estimates '${options_type.optional_inputs.contamination_estimates}'
111 #if $options_type.optional_inputs.haplotype_basis_alleles: 129 #end if
112 --haplotype-basis-alleles "${options_type.optional_inputs.haplotype_basis_alleles}"
113 #end if
114
115 #if $options_type.optional_inputs.observation_bias:
116 --observation-bias "${options_type.optional_inputs.observation_bias}"
117 #end if
118
119 #if $options_type.optional_inputs.contamination_estimates:
120 --contamination-estimates "${options_type.optional_inputs.contamination_estimates}"
121 #end if
122
123 #end if 130 #end if
124 131
125 ## REPORTING 132 ## REPORTING
126 133 #if str( $options_type.reporting.reporting_selector ) == "set":
127
128 #if str( $options_type.reporting.reporting_selector ) == "True":
129 --pvar ${options_type.reporting.pvar} 134 --pvar ${options_type.reporting.pvar}
130 #end if 135 #end if
131 136 ## POPULATION MODEL
132 ## POPULATION MODEL 137 #if str( $options_type.population_model.population_model_selector ) == "set":
133 138 --theta '${options_type.population_model.T}'
134 #if str( $options_type.population_model.population_model_selector ) == "True": 139 --ploidy '${options_type.population_model.P}'
135 --theta "${options_type.population_model.T}"
136 --ploidy "${options_type.population_model.P}"
137 ${options_type.population_model.J} 140 ${options_type.population_model.J}
138 ${options_type.population_model.K} 141 ${options_type.population_model.K}
139
140 #end if 142 #end if
141 143
142 ## REFERENCE ALLELE 144 ## REFERENCE ALLELE
143 145 #if str( $options_type.reference_allele.reference_allele_selector ) == "set":
144 #if str( $options_type.reference_allele.reference_allele_selector ) == "True":
145 ${options_type.reference_allele.Z} 146 ${options_type.reference_allele.Z}
146 --reference-quality "${options_type.reference_allele.reference_quality}" 147 --reference-quality '${options_type.reference_allele.reference_quality}'
147 #end if 148 #end if
148 149
149 ## ALLELE SCOPE 150 ## ALLELE SCOPE
150 151 #if str( $options_type.allele_scope.allele_scope_selector ) == "set":
151 #if str( $options_type.allele_scope.allele_scope_selector ) == "True":
152 ${options_type.allele_scope.I} 152 ${options_type.allele_scope.I}
153 ${options_type.allele_scope.i} 153 ${options_type.allele_scope.i}
154 ${options_type.allele_scope.X} 154 ${options_type.allele_scope.X}
155 ${options_type.allele_scope.u} 155 ${options_type.allele_scope.u}
156 -n "${options_type.allele_scope.n}" 156 -n '${options_type.allele_scope.n}'
157 --haplotype-length "${options_type.allele_scope.haplotype_length}" 157 --haplotype-length '${options_type.allele_scope.haplotype_length}'
158 --min-repeat-size "${options_type.allele_scope.min_repeat_length}" 158 --min-repeat-size '${options_type.allele_scope.min_repeat_length}'
159 --min-repeat-entropy "${options_type.allele_scope.min_repeat_entropy}" 159 --min-repeat-entropy '${options_type.allele_scope.min_repeat_entropy}'
160 ${options_type.allele_scope.no_partial_observations} 160 ${options_type.allele_scope.no_partial_observations}
161 #end if 161 #end if
162 162
163 ## REALIGNMENT 163 ## REALIGNMENT
164
165 ${options_type.O} 164 ${options_type.O}
166 165
167 ##INPUT FILTERS 166 ##INPUT FILTERS
168 167 #if str( $options_type.input_filters.input_filters_selector ) == "set":
169 #if str( $options_type.input_filters.input_filters_selector ) == "True":
170 ${options_type.input_filters.use_duplicate_reads} 168 ${options_type.input_filters.use_duplicate_reads}
171 -m "${options_type.input_filters.m}" 169 -m '${options_type.input_filters.m}'
172 -q "${options_type.input_filters.q}" 170 -q '${options_type.input_filters.q}'
173 -R "${options_type.input_filters.R}" 171 -R '${options_type.input_filters.R}'
174 -Y "${options_type.input_filters.Y}" 172 -Y '${options_type.input_filters.Y}'
175 173
176 #if str( $options_type.input_filters.mismatch_filters.mismatch_filters_selector ) == "True": 174 #if str( $options_type.input_filters.mismatch_filters.mismatch_filters_selector ) == "set":
177 -Q "${options_type.input_filters.mismatch_filters.Q}" 175 -Q '${options_type.input_filters.mismatch_filters.Q}'
178 -U "${options_type.input_filters.mismatch_filters.U}" 176 -U '${options_type.input_filters.mismatch_filters.U}'
179 -z "${options_type.input_filters.mismatch_filters.z}" 177 -z '${options_type.input_filters.mismatch_filters.z}'
180 --read-snp-limit "${options_type.input_filters.mismatch_filters.read_snp_limit}" 178 --read-snp-limit '${options_type.input_filters.mismatch_filters.read_snp_limit}'
181 #end if 179 #end if
182 180
183 -e "${options_type.input_filters.e}" 181 -e '${options_type.input_filters.e}'
184 -F "${options_type.input_filters.F}" 182 -F '${options_type.input_filters.F}'
185 -C "${options_type.input_filters.C}" 183 -C '${options_type.input_filters.C}'
186 --min-alternate-qsum "${options_type.input_filters.min_alternate_qsum}" 184 --min-alternate-qsum "${options_type.input_filters.min_alternate_qsum}"
187 -G "${options_type.input_filters.G}" 185 -G '${options_type.input_filters.G}'
188 --min-coverage "${options_type.input_filters.min_coverage}" 186 --min-coverage '${options_type.input_filters.min_coverage}'
189 #end if 187 #end if
190 188
191 ## POPULATION AND MAPPABILITY PRIORS 189 ## POPULATION AND MAPPABILITY PRIORS
192 190 #if str( $options_type.population_mappability_priors.population_mappability_priors_selector ) == "set":
193 #if str( $options_type.population_mappability_priors.population_mappability_priors_selector ) == "True":
194 ${options_type.population_mappability_priors.k} 191 ${options_type.population_mappability_priors.k}
195 ${options_type.population_mappability_priors.w} 192 ${options_type.population_mappability_priors.w}
196 ${options_type.population_mappability_priors.V} 193 ${options_type.population_mappability_priors.V}
197 ${options_type.population_mappability_priors.a} 194 ${options_type.population_mappability_priors.a}
198 #end if 195 #end if
199 196
200 ## GENOTYPE LIKELIHOODS 197 ## GENOTYPE LIKELIHOODS
201 198 #if str( $options_type.genotype_likelihoods.genotype_likelihoods_selector ) == "set":
202 #if str( $options_type.genotype_likelihoods.genotype_likelihoods_selector ) == "True": 199 --base-quality-cap '${$options_type.genotype_likelihoods.base_quality_cap}'
203 --base-quality-cap "${$options_type.genotype_likelihoods.base_quality_cap}"
204 ${$options_type.genotype_likelihoods.experimental_gls} 200 ${$options_type.genotype_likelihoods.experimental_gls}
205 --prob-contamination "${$options_type.genotype_likelihoods.prob_contamination}" 201 --prob-contamination '${$options_type.genotype_likelihoods.prob_contamination}'
206 #end if 202 #end if
207 203
208 ## ALGORITHMIC FEATURES 204 ## ALGORITHMIC FEATURES
209 205 #if str( $options_type.algorithmic_features.algorithmic_features_selector ) == "set":
210 #if str( $options_type.algorithmic_features.algorithmic_features_selector ) == "True":
211 ${options_type.algorithmic_features.report_genotype_likelihood_max} 206 ${options_type.algorithmic_features.report_genotype_likelihood_max}
212 -B "${options_type.algorithmic_features.B}" 207 -B '${options_type.algorithmic_features.B}'
213 --genotyping-max-banddepth "${options_type.algorithmic_features.genotyping_max_banddepth}" 208 --genotyping-max-banddepth '${options_type.algorithmic_features.genotyping_max_banddepth}'
214 -W "${options_type.algorithmic_features.W}" 209 -W '${options_type.algorithmic_features.W}'
215 ${options_type.algorithmic_features.N} 210 ${options_type.algorithmic_features.N}
216 211
217 #if str( $options_type.algorithmic_features.genotype_variant_threshold.genotype_variant_threshold_selector ) == "True": 212 #if str( $options_type.algorithmic_features.genotype_variant_threshold.genotype_variant_threshold_selector ) == "set":
218 -S "${options_type.algorithmic_features.genotype_variant_threshold.S}" 213 -S '${options_type.algorithmic_features.genotype_variant_threshold.S}'
219 #end if 214 #end if
220 215
221 ${options_type.algorithmic_features.j} 216 ${options_type.algorithmic_features.j}
222 ${options_type.algorithmic_features.H} 217 ${options_type.algorithmic_features.H}
223 -D "${options_type.algorithmic_features.D}" 218 -D '${options_type.algorithmic_features.D}'
224 ${options_type.algorithmic_features.genotype_qualities} 219 ${options_type.algorithmic_features.genotype_qualities}
225 #end if 220 #end if
226 #end if 221 #end if
227 222
228 </command> 223 ";
229 224 done > freebayes_commands.sh &&
230 <inputs> 225 cat freebayes_commands.sh | parallel --no-notice -j \${GALAXY_SLOTS:-1} &&
231 <conditional name="reference_source"> 226
232 <param name="reference_source_selector" type="select" label="Load reference genome from"> 227 ## make VCF header
233 <option value="cached">Local cache</option> 228
234 <option value="history">History</option> 229 grep "^#" "./vcf_output/part_\$i.vcf" > header.txt &&
235 </param> 230
236 <when value="cached"> 231 for i in `cat regions_uniq.bed | awk '{print $1":"$2".."$3}'`;
237 <repeat name="input_bams" title="Sample BAM file" min="1"> 232 do
238 <param name="input_bam" type="data" format="bam" label="BAM file"> 233 ## if this fails then it bails out the script
239 <validator type="unspecified_build" /> 234 cat "./vcf_output/part_\$i.vcf" | grep -v "^#" || true
240 <validator type="dataset_metadata_in_data_table" table_name="fasta_indexes" metadata_name="dbkey" metadata_column="1" message="Sequences are not currently available for the specified build." /> 235 ;
236 done | sort -k1,1 -k2,2n -k5,5 -u | cat header.txt - > "${output_vcf}"
237
238 #if str( $options_type.options_type_selector ) == "full":
239 #if str( $options_type.optional_inputs.optional_inputs_selector ) == 'set':
240 #if $options_type.optional_inputs.output_failed_alleles_option:
241 &&
242 for i in `cat regions.bed | awk '{print $1":"$2".."$3}'`;
243 do
244 cat "./failed_alleles/part_\$i.bed"
245 ;
246 done > '${output_failed_alleles_bed}'
247 #end if
248
249 #if $options_type.optional_inputs.output_trace_option:
250 &&
251 for i in `cat regions.bed | awk '{print $1":"$2".."$3}'`;
252 do
253 cat './trace/part_\$i.txt'
254 ;
255 done > '${output_trace}'
256 #end if
257 #end if
258 #end if
259 ]]>
260 </command>
261
262 <inputs>
263 <conditional name="reference_source">
264 <param name="reference_source_selector" type="select" label="Load reference genome from">
265 <option value="cached">Local cache</option>
266 <option value="history">History</option>
241 </param> 267 </param>
242 </repeat> 268 <when value="cached">
243 269 <param name="input_bams" type="data" format="bam" multiple="True" label="BAM file">
244 <param name="ref_file" type="select" label="Using reference genome"> 270 <validator type="unspecified_build" />
245 <options from_data_table="fasta_indexes"></options> 271 <validator type="dataset_metadata_in_data_table" table_name="fasta_indexes" metadata_name="dbkey" metadata_column="1" message="Sequences are not currently available for the specified build." />
246 <validator type="no_options" message="A built-in reference genome is not available for the build associated with the selected input file"/> 272 </param>
247 </param> 273 <param name="ref_file" type="select" label="Using reference genome">
248 </when> 274 <options from_data_table="fasta_indexes"></options>
249 <when value="history"> <!-- FIX ME!!!! --> 275 <validator type="no_options" message="A built-in reference genome is not available for the build associated with the selected input file"/>
250 <repeat name="input_bams" title="Sample BAM file" min="1"> 276 </param>
251 <param name="input_bam" type="data" format="bam" label="BAM file" /> 277 </when>
252 </repeat> 278 <when value="history"> <!-- FIX ME!!!! -->
253 <param name="ref_file" type="data" format="fasta" label="Use the following dataset as the reference sequence" help="You can upload a FASTA sequence to the history and use it as reference" /> 279 <param name="input_bams" type="data" format="bam" multiple="True" label="BAM file" />
254 </when> 280 <param name="ref_file" type="data" format="fasta" label="Use the following dataset as the reference sequence"
255 </conditional> 281 help="You can upload a FASTA sequence to the history and use it as reference" />
256 282 </when>
257 <conditional name="target_limit_type"> 283 </conditional>
258 <param name="target_limit_type_selector" type="select" label="Limit variant calling to a set of regions?" help="Sets --targets or --region options"> 284 <conditional name="target_limit_type">
259 <option value="do_not_limit" selected="True">Do not limit</option> 285 <param name="target_limit_type_selector" type="select" label="Limit variant calling to a set of regions?" help="Sets --targets or --region options">
260 <option value="limit_by_target_file">Limit by target file</option> 286 <option value="do_not_limit" selected="True">Do not limit</option>
261 <option value="limit_by_region">Limit to region</option> 287 <option value="limit_by_target_file">Limit by target file</option>
262 </param> 288 <option value="limit_by_region">Limit to region</option>
263 <when value="do_not_limit"> 289 </param>
264 <!-- Do nothing here --> 290 <when value="do_not_limit">
265 </when>
266 <when value="limit_by_target_file">
267 <param name="input_target_bed" type="data" format="bed" label="Limit analysis to targets listed in the BED-format FILE." help="-t --targets"/>
268 </when>
269 <when value="limit_by_region">
270 <param name="region_chromosome" type="text" label="Region Chromosome" value="" help="-r --region"/> <!--only once? -->
271 <param name="region_start" type="integer" label="Region Start" value="" />
272 <param name="region_end" type="integer" label="Region End" value="" />
273 </when>
274 </conditional>
275
276 <conditional name="options_type">
277 <param name="options_type_selector" type="select" label="Choose parameter selection level" help="Select how much control over the freebayes run you need" >
278 <option value="simple" selected="True">1:Simple diploid calling</option>
279 <option value="simple_w_filters">2:Simple diploid calling with filtering and coverage</option>
280 <option value="naive">3:Frequency-based pooled calling</option>
281 <option value="naive_w_filters">4:Frequency-based pooled calling with filtering and coverage</option>
282 <option value="full">5:Complete list of all options</option>
283 <!-- We will not alloow command line text boxes at this time
284 <option value="cline">6:Input parameters on the command line</option>
285 -->
286 </param>
287 <when value="full">
288
289 <conditional name="optional_inputs">
290 <param name="optional_inputs_selector" type="boolean" truevalue="set" falsevalue="do_not_set" label="Do you want to provide additional inputs?" help="Sets --samples, --populations, --cnv-map, --trace, --failed-alleles, --varinat-input, --only-use-input-alleles, --haplotype-basis-alleles, --report-all-haplotype-alleles, --report-monomorphic options, --observation-bias, and --contamination-estimates" />
291 <when value="set">
292 <param name="output_failed_alleles_option" type="boolean" truevalue="--failed-alleles" falsevalue="" checked="False" label="Write out failed alleles file" help="--failed-alleles" />
293 <param name="output_trace_option" type="boolean" truevalue="--trace" falsevalue="" checked="False" label="Write out algorithm trace file" help="--trace"/>
294 <param name="samples" type="data" format="txt" label="Limit analysis to samples listed (one per line) in the FILE" optional="True" help="-s --samples; default=By default FreeBayes will analyze all samples in its input BAM files"/>
295 <param name="populations" type="data" format="txt" label="Populations File" optional="True" help="--populations; default=False. Each line of FILE should list a sample and a population which it is part of. The population-based bayesian inference model will then be partitioned on the basis of the populations" />
296 <param name="A" type="data" format="bed" label="Read a copy number map from the BED file FILE" optional="True" help="-A --cnv-map; default=copy number is set to as specified by --ploidy. Read a copy number map from the BED file FILE, which has the format: reference sequence, start, end, sample name, copy number ... for each region in each sample which does not have the default copy number as set by --ploidy."/>
297 <conditional name="input_variant_type">
298 <param name="input_variant_type_selector" type="select" label="Provide variants file">
299 <option value="do_not_provide" selected="True">Do not provide</option>
300 <option value="provide_vcf">Provide VCF file</option>
301 </param>
302 <when value="do_not_provide">
303 <!-- Do nothing here --> 291 <!-- Do nothing here -->
304 </when> 292 </when>
305 <when value="provide_vcf"> 293 <when value="limit_by_target_file">
306 <param name="input_variant_vcf" type="data" format="vcf_bgzip" label="Use variants reported in VCF file as input to the algorithm"> 294 <param name="input_target_bed" type="data" format="bed" label="Limit analysis to targets listed in the BED-format FILE." help="-t --targets"/>
307 <conversion name="Tabixized_input" type="tabix" /> 295 </when>
308 </param> 296 <when value="limit_by_region">
309 <param name="only_use_input_alleles" type="boolean" truevalue="--only-use-input-alleles" falsevalue="" checked="False" label="Only provide variant calls and genotype likelihoods for sites in VCF" /> 297 <param name="region_chromosome" type="text" label="Region Chromosome" value="" help="-r --region"/> <!--only once? -->
310 </when> 298 <param name="region_start" type="integer" label="Region Start" value="" />
311 </conditional> 299 <param name="region_end" type="integer" label="Region End" value="" />
312 <param name="haplotype_basis_alleles" type="data" format="vcf" label="Only use variant alleles provided in this input VCF for the construction of complex or haplotype alleles" optional="True" help="--haplotype-basis-alleles" /> 300 </when>
313 <param name="report_monomorphic" type="boolean" truevalue="--report-monomorphic" falsevalue="" checked="False" label="Report even loci which appear to be monomorphic, and report all considered alleles, even those which are not in called genotypes." help="--report-monomorphic " />
314 <param name="observation_bias" optional="True" type="data" format="tabular" label="Load read length-dependent allele observation biases from" help="--observation-bias; The format is [length] [alignment efficiency relative to reference] where the efficiency is 1 if there is no relative observation bias" />
315 <param name="contamination_estimates" optional="True" type="data" format="tabular" label="Upload per-sample estimates of contamination from" help="--contamination-estimates; The format should be: sample p(read=R|genotype=AR) p(read=A|genotype=AA) Sample '*' can be used to set default contamination estimates." />
316 </when>
317 <when value="do_not_set">
318 <!-- do nothing -->
319 </when>
320 </conditional> 301 </conditional>
321 302 <conditional name="options_type">
322 <!-- reporting --> 303 <param name="options_type_selector" type="select" label="Choose parameter selection level" help="Select how much control over the freebayes run you need" >
323 304 <option value="simple" selected="True">1:Simple diploid calling</option>
324 <conditional name="reporting"> 305 <option value="simple_w_filters">2:Simple diploid calling with filtering and coverage</option>
325 <param name="reporting_selector" type="boolean" truevalue="set" falsevalue="do_not_set" label="Set reporting option?" help="Sets -P --pvar option" /> 306 <option value="naive">3:Frequency-based pooled calling</option>
326 <when value="set"> 307 <option value="naive_w_filters">4:Frequency-based pooled calling with filtering and coverage</option>
327 <param name="pvar" type="float" value="0.0" label="Report sites if the probability that there is a polymorphism at the site is greater than" help="-P --pvar; default=0.0. Note that post-filtering is generally recommended over the use of this parameter. " /> 308 <option value="full">5:Complete list of all options</option>
328 </when> 309 <!-- We will not alloow command line text boxes at this time
329 <when value="do_not_set"> 310 <option value="cline">6:Input parameters on the command line</option>
330 <!-- do nothing --> 311 -->
331 </when> 312 </param>
313 <when value="full">
314 <conditional name="optional_inputs">
315 <param name="optional_inputs_selector" type="select" label="Additional inputs"
316 help="Sets --samples, --populations, --cnv-map, --trace, --failed-alleles, --varinat-input, --only-use-input-alleles, --haplotype-basis-alleles,
317 --report-all-haplotype-alleles, --report-monomorphic options, --observation-bias, and --contamination-estimates">
318 <option value="do_not_set" selected="true">Do not provide additional inputs</option>
319 <option value="set">Provide additional inputs</option>
320 </param>
321 <when value="set">
322 <param name="output_failed_alleles_option" type="boolean" truevalue="--failed-alleles" falsevalue="" checked="False"
323 label="Write out failed alleles file" help="--failed-alleles" />
324 <param name="output_trace_option" type="boolean" truevalue="--trace" falsevalue="" checked="False"
325 label="Write out algorithm trace file" help="--trace"/>
326 <param name="samples" type="data" format="txt" label="Limit analysis to samples listed (one per line) in the FILE" optional="True"
327 help="-s --samples; default=By default FreeBayes will analyze all samples in its input BAM files"/>
328 <param name="populations" type="data" format="txt" label="Populations File" optional="True"
329 help="--populations; default=False. Each line of FILE should list a sample and a population which it is part of.
330 The population-based bayesian inference model will then be partitioned on the basis of the populations" />
331 <param name="A" type="data" format="bed" label="Read a copy number map from the BED file FILE" optional="True"
332 help="-A --cnv-map; default=copy number is set to as specified by --ploidy. Read a copy number map from the BED file FILE, which has the format:
333 reference sequence, start, end, sample name, copy number ... for each region in each sample which does not have the default copy number as set by --ploidy."/>
334 <conditional name="input_variant_type">
335 <param name="input_variant_type_selector" type="select" label="Provide variants file">
336 <option value="do_not_provide" selected="True">Do not provide</option>
337 <option value="provide_vcf">Provide VCF file</option>
338 </param>
339 <when value="do_not_provide">
340 <!-- Do nothing here -->
341 </when>
342 <when value="provide_vcf">
343 <param name="input_variant_vcf" type="data" format="vcf_bgzip" label="Use variants reported in VCF file as input to the algorithm">
344 <conversion name="Tabixized_input" type="tabix" />
345 </param>
346 <param name="only_use_input_alleles" type="boolean" truevalue="--only-use-input-alleles" falsevalue="" checked="False" label="Only provide variant calls and genotype likelihoods for sites in VCF" />
347 </when>
348 </conditional>
349 <param name="haplotype_basis_alleles" type="data" format="vcf" label="Only use variant alleles provided in this input VCF for the construction of complex or haplotype alleles" optional="True"
350 help="--haplotype-basis-alleles" />
351 <param name="report_monomorphic" type="boolean" truevalue="--report-monomorphic" falsevalue="" checked="False"
352 label="Report even loci which appear to be monomorphic, and report all considered alleles, even those which are not in called genotypes."
353 help="--report-monomorphic " />
354 <param name="observation_bias" optional="True" type="data" format="tabular" label="Load read length-dependent allele observation biases from"
355 help="--observation-bias; The format is [length] [alignment efficiency relative to reference] where the efficiency is 1 if there is no relative observation bias" />
356 <param name="contamination_estimates" optional="True" type="data" format="tabular" label="Upload per-sample estimates of contamination from"
357 help="--contamination-estimates; The format should be: sample p(read=R|genotype=AR) p(read=A|genotype=AA) Sample '*' can be used to set default contamination estimates." />
358 </when>
359 <when value="do_not_set">
360 <!-- do nothing -->
361 </when>
362 </conditional>
363 <!-- reporting -->
364 <conditional name="reporting">
365 <param name="reporting_selector" type="select" label="Reporting options" help="Sets -P --pvar option">
366 <option value="do_not_set" selected="True">Use defaults</option>
367 <option value="set">Set reporting options</option>
368 </param>
369 <when value="set">
370 <param name="pvar" type="float" value="0.0" label="Report sites if the probability that there is a polymorphism at the site is greater than"
371 help="-P --pvar; default=0.0. Note that post-filtering is generally recommended over the use of this parameter. " />
372 </when>
373 <when value="do_not_set">
374 <!-- do nothing -->
375 </when>
376 </conditional>
377 <!-- population model -->
378 <conditional name="population_model">
379 <param name="population_model_selector" type="select" label="Population model options"
380 help="Sets --theta, --ploidy, --pooled-discrete, and --pooled-continuous options " >
381 <option value="do_not_set" selected="true">Use defaults</option>
382 <option value="set">Set population model options</option>
383 </param>
384 <when value="set">
385 <param name="T" type="float" value="0.001" label="The expected mutation rate or pairwise nucleotide diversity among the population under analysis"
386 help="-T --theta; default = 0.001. This serves as the single parameter to the Ewens Sampling Formula prior model." />
387 <param name="P" type="integer" value="2" label="Set ploidy for the analysis" help="-p --ploidy; default=2" />
388 <param name="J" type="boolean" truevalue="-J" falsevalue="" checked="False" label="Assume that samples result from pooled sequencing"
389 help="-J --pooled-discrete; default=False. Model pooled samples using discrete genotypes across pools.
390 When using this flag, set --ploidy to the number of alleles in each sample or use the --cnv-map to define per-sample ploidy." />
391 <param name="K" type="boolean" truevalue="-K" falsevalue="" checked="False" label="Output all alleles which pass input filters, regardles of genotyping outcome or model"
392 help="-K, --poled-continuous; default=False." />
393 </when>
394 <when value="do_not_set">
395 <!-- do nothing -->
396 </when>
397 </conditional>
398 <!-- reference allele -->
399 <conditional name="reference_allele">
400 <param name="reference_allele_selector" type="select" label="Reference allele options"
401 help="Sets --use-reference-allele and --reference-quality options.">
402 <option value="do_not_set" selected="true">Use defaults</option>
403 <option value="set">Set reference allele options</option>
404 </param>
405 <when value="set">
406 <param name="Z" type="boolean" truevalue="-Z" falsevalue="" checked="False" label="Include the reference allele in the analysis as if it is another sample from the same population"
407 help="-Z --use-reference-allele; default=False" />
408 <param name="reference_quality" type="text" value="100,60" label="Assign mapping quality of MQ (100) to the reference allele at each site and base quality of BQ (60)"
409 help="--reference-quality; default=100,60 " />
410 </when>
411 <when value="do_not_set">
412 <!-- do nothing -->
413 </when>
414 </conditional>
415 <!-- allelic scope -->
416 <conditional name="allele_scope">
417 <param name="allele_scope_selector" type="select" label="Allelic scope options"
418 help="Sets -I, i, -X, -u, -n, --haplotype-length, --min-repeat-size, --min-repeat-entropy, and --no-partial-observations options.">
419 <option value="do_not_set" selected="true">Use defaults</option>
420 <option value="set">Set alleic scope options</option>
421 </param>
422 <when value="set">
423 <param name="I" type="boolean" truevalue="-I" falsevalue="" checked="False" label="Ignore SNP alleles" help="-I --no-snps; default=False" />
424 <param name="i" type="boolean" truevalue="-i" falsevalue="" checked="False" label="Ignore indels alleles" help="-i --no-indels; default=False" />
425 <param name="X" type="boolean" truevalue="-X" falsevalue="" checked="False" label="Ignore multi-nucleotide polymorphisms, MNPs" help="-X --no-mnps; default=False" />
426 <param name="u" type="boolean" truevalue="-u" falsevalue="" checked="False" label="Ignore complex events (composites of other classes)."
427 help="-u --no-complex; default=False" />
428 <param name="n" type="integer" value="0" label="How many best SNP alleles to evaluate"
429 help="-n --use-best-n-alleles; default=0 (all). Alleles are ranked by the sum of supporting quality scores. Set to 0 to evaluate all" />
430 <param name="haplotype_length" type="integer" value="3" label="Allow haplotype calls with contiguous embedded matches of up to (nucleotides)"
431 help="-E --max-complex-gap --haplotype-length; default=3." />
432 <param name="min_repeat_length" type="integer" value="5" label="When assembling observations across repeats, require the total repeat length at least this many bp"
433 help="--min-repeat-size; default=5." />
434 <param name="min_repeat_entropy" type="integer" value="0" label="To detect interrupted repeats, build across sequence until it has entropy > (bits per bp)"
435 help="--min-repeat-entropy; default=0 (off)." />
436 <param name="no_partial_observations" type="boolean" truevalue="--no-partial-observations" falsevalue="" checked="False"
437 label="Exclude observations which do not fully span the dynamically-determined detection window"
438 help="--no-partial-observations; default=use all observations, dividing partial support across matching haplotypes when generating haplotypes." />
439 </when>
440 <when value="do_not_set">
441 <!-- do nothing -->
442 </when>
443 </conditional>
444 <!-- indel realignment -->
445 <param name="O" type="boolean" truevalue="-O" falsevalue="" checked="False" label="Turn off left-alignment of indels?"
446 help="-O --dont-left-align-indels; default=False (do left align)." />
447 <!-- input filters -->
448 <conditional name="input_filters">
449 <param name="input_filters_selector" type="select" label="Input filters"
450 help="Sets -4, -m, -q, -R, -Y, -Q, -U, -z, -&#36;, -e, -0, -F, -C, -3, -G, and -&#33; options.">
451 <option value="do_not_set" selected="true">No input filters (default)</option>
452 <option value="set">Set input filters</option>
453 </param>
454 <when value="set">
455 <param name="use_duplicate_reads" type="boolean" truevalue="--use-duplicate-reads" falsevalue="" checked="False"
456 label="Include duplicate-marked alignments in the analysis."
457 help="-4 --use-duplicate-reads; default=False (exclude duplicates marked as such in alignments)." />
458 <param name="m" type="integer" value="1" label="Exclude alignments from analysis if they have a mapping quality less than"
459 help="-m --min-mapping-quality; default=1" />
460 <param name="q" type="integer" value="0" label="Exclude alleles from analysis if their supporting base quality less than"
461 help="-q --min-base-quality; default=0" />
462 <param name="R" type="integer" value="0" label="Consider any allele in which the sum of qualities of supporting observations is at least"
463 help="-R --min-supporting-allele-qsum; default=0" />
464 <param name="Y" type="integer" value="0" label="Consider any allele in which and the sum of mapping qualities of supporting reads is at least"
465 help="-Y --min-supporting-mapping-qsum; default=0" />
466 <conditional name="mismatch_filters">
467 <param name="mismatch_filters_selector" type="select" label="Mismatch filters"
468 help="Sets -Q, -U, -z, and &#36; options">
469 <option value="do_not_set" selected="true">No mismatch filters (default)</option>
470 <option value="set">Set mismatch filters</option>
471 </param>
472 <when value="set">
473 <param name="Q" type="integer" value="10" label="Count mismatches toward -U (option below) if the base quality of the mismatch is >="
474 help="-Q --mismatch-base-quality-threshold; default=10" />
475 <param name="U" type="integer" value="1000" optional="True" label="Exclude reads with more than N mismatches where each mismatch has base quality >= Q (option above)"
476 help="-U --read-mismatch-limit; default=~unbound" />
477 <param name="z" type="float" value="1.0" min="0.0" max="1.0"
478 label="Exclude reads with more than N [0,1] fraction of mismatches where each mismatch has base quality >= Q (second option above)"
479 help="-z --read-max-mismatch-fraction; default=1.0" />
480 <param name="read_snp_limit" type="integer"
481 value="1000" label="Exclude reads with more than N base mismatches, ignoring gaps with quality >= Q (third option abobe)"
482 help="-$amp; --read-snp-limit N " />
483 </when>
484 <when value="do_not_set">
485 <!-- do nothing -->
486 </when>
487 </conditional>
488 <param name="e" type="integer" value="1000" label="Exclude reads with more than this number of separate gaps"
489 help="-e --read-snp-limit; default=~unbounded" />
490 <param name="standard_filters" type="boolean" truevalue="-0" falsevalue="" checked="False" label="Use stringent input base and mapping quality filters"
491 help="-0 --standard-filters; default=False. Equivalent to -m 30 -q 20 -R 0 -S 0" />
492 <param name="F" type="float" value="0.2"
493 label="Require at least this fraction of observations supporting an alternate allele within a single individual in the in order to evaluate the position"
494 help="-F --min-alternate-fraction; default=0.2" />
495 <param name="C" type="integer" value="2"
496 label="Require at least this count of observations supporting an alternate allele within a single individual in order to evaluate the position"
497 help="-C --min-alternate-count; default=2" />
498 <param name="min_alternate_qsum" type="integer" value="0"
499 label="Require at least this sum of quality of observations supporting an alternate allele within a single individual in order to evaluate the position"
500 help="-3 --min-alternate-qsum; default=0" />
501 <param name="G" type="integer" value="1"
502 label="Require at least this count of observations supporting an alternate allele within the total population in order to use the allele in analysis"
503 help="-G --min-alternate-total N; default=1" />
504 <param name="min_coverage" type="integer" value="0" label="Require at least this coverage to process a site"
505 help="-! --min-coverage; default=0 " />
506 </when>
507 <when value="do_not_set">
508 <!-- do nothing -->
509 </when>
510 </conditional>
511 <!-- population and mappability priors -->
512 <conditional name="population_mappability_priors">
513 <param name="population_mappability_priors_selector" type="select" label="Population and mappability priors"
514 help="Sets -k, -w, -V, and -a options.">
515 <option value="do_not_set" selected="true">Use defaults</option>
516 <option value="set">Set population and mappability priors</option>
517 </param>
518 <when value="set">
519 <param name="k" type="boolean" truevalue="-k" falsevalue="" checked="False" label="No population priors"
520 help="-k --no-population-priors; default=False. Equivalent to --pooled-discrete --hwe-priors-off and removal of Ewens Sampling Formula component of priors." />
521 <param name="w" type="boolean" truevalue="-w" falsevalue="" checked="False"
522 label="Disable estimation of the probability of the combination arising under HWE given the allele frequency as estimated by observation frequency"
523 help="-w --hwe-priors-off; default=False" />
524 <param name="V" type="boolean" truevalue="-V" falsevalue="" checked="False" label="Disable incorporation of prior expectations about observations"
525 help="-V --binomial-obs-priors-off; default=False. Uses read placement probability, strand balance probability, and read position (5&#39;'-3&#39;') probability." />
526 <param name="a" type="boolean" truevalue="-a" falsevalue="" checked="False"
527 label="isable use of aggregate probability of observation balance between alleles as a component of the priors"
528 help="-a --allele-balance-priors-off; default=False " />
529 </when>
530 <when value="do_not_set">
531 <!-- do nothing -->
532 </when>
533 </conditional>
534 <!-- genotype likelihoods -->
535 <conditional name="genotype_likelihoods">
536 <param name="genotype_likelihoods_selector" type="select" label="Genotype likelihood options"
537 help="Sets --base-quality-cap, --experimental-gls, and --prob-contamination options.">
538 <option value="do_not_set" selected="true">Use defaults</option>
539 <option value="set">Set genotype likelihood options</option>
540 </param>
541 <when value="set">
542 <param name="base_quality_cap" type="integer" value="0" label="Limit estimated observation quality by capping base quality at" help="--base-quality-cap" />
543 <param name="experimental_gls" type="boolean" truevalue="--experimental-gls" falsevalue="" checked="False"
544 label="Generate genotype likelihoods using 'effective base depth' metric qual = 1-BaseQual * 1-MapQual"
545 help="--experimental-gls; Incorporate partial observations. This is the default when contamination estimates are provided. Optimized for diploid samples." />
546 <param name="prob_contamination" type="float" value="10e-9" label="An estimate of contamination to use for all samples"
547 help="--prob-contamination; default=10e-9." />
548 </when>
549 <when value="do_not_set">
550 <!-- do nothing -->
551 </when>
552 </conditional>
553 <!-- algorithmic features -->
554 <conditional name="algorithmic_features">
555 <param name="algorithmic_features_selector" type="select" label="Algorithmic features"
556 help="Sets --report-genotypes-likelihood-max, -B, --genotyping-max-banddepth, -W, -N, S, -j, -H, -D, -= options">
557 <option value="do_not_set" selected="true">Use defaults</option>
558 <option value="set">Set algorithmic features</option>
559 </param>
560 <when value="set">
561 <param name="report_genotype_likelihood_max" type="boolean" truevalue="--report-genotype-likelihood-max" falsevalue="" checked="False"
562 label="Report genotypes using the maximum-likelihood estimate provided from genotype likelihoods."
563 help="--report-genotype-likelihood-max; default=False" />
564 <param name="B" type="integer" value="1000" label="Iterate no more than N times during genotyping step"
565 help="-B --genotyping-max-iterations; default=1000." />
566 <param name="genotyping_max_banddepth" type="integer" value="6" label="Integrate no deeper than the Nth best genotype by likelihood when genotyping"
567 help="--genotyping-max-banddepth; default=6" />
568 <param name="W" type="text" value="1,3"
569 label="Integrate all genotype combinations in our posterior space which include no more than N (1) samples with their Mth (3) best data likelihood"
570 help="-W --posterior-integration-limits; default=1,3" />
571 <param name="N" type="boolean" truevalue="--exclude-unobserved-genotypes" falsevalue="" checked="False"
572 label="Skip sample genotypings for which the sample has no supporting reads"
573 help="-N --exclude-unobserved-genotypes; default=False" />
574 <conditional name="genotype_variant_threshold">
575 <param name="genotype_variant_threshold_selector" type="select"
576 label="Limit posterior integration"
577 help="-S --genotype-variant-threshold">
578 <option value="do_not_set" selected="true">Do not limit posterior integration</option>
579 <option value="set">Set posterior integration limit</option>
580 </param>
581 <when value="do_not_set">
582 <!-- do nothing -->
583 </when>
584 <when value="set">
585 <param name="S" value="" type="integer"
586 label="Limit posterior integration to samples where the second-best genotype likelihood is no more than log(N) from the highest genotype likelihood for the sample."
587 help="-S --genotype-variant-threshold; default=~unbounded" />
588 </when>
589 </conditional>
590 <param name="j" type="boolean" truevalue="-j" falsevalue="" checked="False" label="Use mapping quality of alleles when calculating data likelihoods"
591 help="-j --use-mapping-quality; default=False" />
592 <param name="H" type="boolean" truevalue="-H" falsevalue="" checked="False"
593 label="Use a weighted sum of base qualities around an indel, scaled by the distance from the indel"
594 help="-H --harmonic-indel-quality; default=use a minimum Base Quality in flanking sequence." />
595 <param name="D" type="float" value="0.9" label="Incorporate non-independence of reads by scaling successive observations by this factor during data likelihood calculations"
596 help="-D --read-dependence-factor; default=0.9." />
597 <param name="genotype_qualities" type="boolean" truevalue="--genotype-qualities" falsevalue="" checked="False"
598 label="Calculate the marginal probability of genotypes and report as GQ in each sample field in the VCF output"
599 help="-= --genotype-qualities; default=False " />
600 </when>
601 <when value="do_not_set">
602 <!-- do nothing -->
603 </when>
604 </conditional>
605 </when>
606 <when value="simple">
607 <!-- do nothing -->
608 </when>
609 <when value="simple_w_filters">
610 <!-- add standard-filters to command line -->
611 <param name="min_coverage" type="integer" value="0" label="Require at least this coverage to process a site" help="-! --min-coverage; default=0 " />
612 </when>
613 <when value="naive">
614 <!-- do nothing build command line using haplotype-length 0 min-alternate-count 1 min-alternate-fraction 0 pooled-continuous report-monomorphic -->
615 </when>
616 <when value="naive_w_filters">
617 <!-- do nothing build command line using haplotype-length 0 min-alternate-count 1 min-alternate-fraction 0 pooled-continuous report-monomorphic standard-filters-->
618 <param name="min_coverage" type="integer" value="0" label="Require at least this coverage to process a site" help="-! --min-coverage; default=0 " />
619 </when>
332 </conditional> 620 </conditional>
333 621 </inputs>
334 <!-- population model --> 622 <outputs>
335 623 <data format="vcf" name="output_vcf" label="${tool.name} on ${on_string} (variants)" />
336 <conditional name="population_model"> 624 <data format="bed" name="output_failed_alleles_bed" label="${tool.name} on ${on_string} (failed alleles)">
337 <param name="population_model_selector" type="boolean" truevalue="set" falsevalue="do_not_set" label="Set population model?" help="Sets --theta, --ploidy, --pooled-discrete, and --pooled-continuous options " /> 625 <filter>( options_type['options_type_selector'] == 'cline' or options_type['options_type_selector'] == 'full' ) and options_type['optional_inputs']['optional_inputs_selector'] == 'set' and options_type['optional_inputs']['output_failed_alleles_option'] is True</filter>
338 <when value="set"> 626 </data>
339 <param name="T" type="float" value="0.001" label="The expected mutation rate or pairwise nucleotide diversity among the population under analysis" help="-T --theta; default = 0.001. This serves as the single parameter to the Ewens Sampling Formula prior model." /> 627 <data format="txt" name="output_trace" label="${tool.name} on ${on_string} (trace)">
340 <param name="P" type="integer" value="2" label="Set ploidy for the analysis" help="-p --ploidy; default=2" /> 628 <filter>( options_type['options_type_selector'] == 'cline' or options_type['options_type_selector'] == 'full' ) and options_type['optional_inputs']['optional_inputs_selector'] == 'set' and options_type['optional_inputs']['output_trace_option'] is True</filter>
341 <param name="J" type="boolean" truevalue="-J" falsevalue="" checked="False" label="Assume that samples result from pooled sequencing" help="-J --pooled-discrete; default=False. Model pooled samples using discrete genotypes across pools. When using this flag, set --ploidy to the number of alleles in each sample or use the --cnv-map to define per-sample ploidy." /> 629 </data>
342 <param name="K" type="boolean" truevalue="-K" falsevalue="" checked="False" label="Output all alleles which pass input filters, regardles of genotyping outcome or model" help="-K, --poled-continuous; default=False. " /> 630 </outputs>
343 </when> 631 <tests>
344 <when value="do_not_set"> 632 <test>
345 <!-- do nothing --> 633 <param name="reference_source_selector" value="history" />
346 </when> 634 <param name="ref_file" ftype="fasta" value="freebayes-phix174.fasta"/>
347 </conditional> 635 <param name="input_bams" ftype="bam" value="freebayes-phix174.bam"/>
348 636 <param name="options_type_selector" value="simple"/>
349 <!-- reference allele --> 637 <output name="output_vcf" file="freebayes-phix174-test1.vcf" compare="contains"/>
350 638 </test>
351 <conditional name="reference_allele"> 639 <test>
352 <param name="reference_allele_selector" type="boolean" truevalue="set" falsevalue="do_not_set" label="Use reference allele?" help="Sets --use-reference-allele and --reference-quality options " /> 640 <param name="reference_source_selector" value="history" />
353 <when value="set"> 641 <param name="ref_file" ftype="fasta" value="freebayes-phix174.fasta"/>
354 <param name="Z" type="boolean" truevalue="-Z" falsevalue="" checked="False" label="Include the reference allele in the analysis as if it is another sample from the same population" help="-Z --use-reference-allele; default=False" /> 642 <param name="input_bams" ftype="bam" value="freebayes-phix174.bam"/>
355 <param name="reference_quality" type="text" value="100,60" label="Assign mapping quality of MQ (100) to the reference allele at each site and base quality of BQ (60)" help="--reference-quality; default=100,60 " /> 643 <param name="options_type_selector" value="naive_w_filters"/>
356 </when> 644 <param name="min_coverage" value="14"/>
357 <when value="do_not_set"> 645 <output name="output_vcf" file="freebayes-phix174-test2.vcf" compare="contains"/>
358 <!-- do nothing --> 646 </test>
359 </when> 647 <test>
360 </conditional> 648 <param name="reference_source_selector" value="history" />
361 649 <param name="ref_file" ftype="fasta" value="freebayes-phix174.fasta"/>
362 <!-- allelic scope --> 650 <param name="input_bams" ftype="bam" value="freebayes-phix174.bam"/>
363 651 <param name="options_type_selector" value="naive_w_filters"/>
364 <conditional name="allele_scope"> 652 <param name="min_coverage" value="14"/>
365 <param name="allele_scope_selector" type="boolean" truevalue="set" falsevalue="do_not_set" label="Set allelic scope?" help="Sets -I, i, -X, -u, -n, --haplotype-length, --min-repeat-size, --min-repeat-entropy, and --no-partial-observations options " /> 653 <output name="output_vcf" file="freebayes-phix174-test3.vcf" compare="contains"/>
366 <when value="set"> 654 </test>
367 <param name="I" type="boolean" truevalue="-I" falsevalue="" checked="False" label="Ignore SNP alleles" help="-I --no-snps; default=False" /> 655 <test>
368 <param name="i" type="boolean" truevalue="-i" falsevalue="" checked="False" label="Ignore indels alleles" help="-i --no-indels; default=False" /> 656 <param name="reference_source_selector" value="history" />
369 <param name="X" type="boolean" truevalue="-X" falsevalue="" checked="False" label="Ignore multi-nucleotide polymorphisms, MNPs" help="-X --no-mnps; default=False" /> 657 <param name="ref_file" ftype="fasta" value="freebayes-phix174.fasta"/>
370 <param name="u" type="boolean" truevalue="-u" falsevalue="" checked="False" label="Ignore complex events (composites of other classes)." help="-u --no-complex; default=False" /> 658 <param name="input_bams" ftype="bam" value="freebayes-phix174.bam"/>
371 <param name="n" type="integer" value="0" label="How many best SNP alleles to evaluate" help="-n --use-best-n-alleles; default=0 (all). Alleles are ranked by the sum of supporting quality scores. Set to 0 to evaluate all" /> 659 <param name="options_type_selector" value="full"/>
372 <param name="haplotype_length" type="integer" value="3" label="Allow haplotype calls with contiguous embedded matches of up to (nucleotides)" help="-E --max-complex-gap --haplotype-length; default=3." /> 660 <param name="population_model_selector" value="set"/>
373 <param name="min_repeat_length" type="integer" value="5" label="When assembling observations across repeats, require the total repeat length at least this many bp" help="--min-repeat-size; default=5." /> 661 <param name="P" value="1"/>
374 <param name="min_repeat_entropy" type="integer" value="0" label="To detect interrupted repeats, build across sequence until it has entropy > (bits per bp)" help="--min-repeat-entropy; default=0 (off)." /> 662 <output name="output_vcf" file="freebayes-phix174-test4.vcf" compare="contains"/>
375 <param name="no_partial_observations" type="boolean" truevalue="--no-partial-observations" falsevalue="" checked="False" label="Exclude observations which do not fully span the dynamically-determined detection window" help="--no-partial-observations; default=use all observations, dividing partial support across matching haplotypes when generating haplotypes. " /> 663 </test>
376 </when> 664 </tests>
377 <when value="do_not_set"> 665 <help>
378 <!-- do nothing -->
379 </when>
380 </conditional>
381
382 <!-- indel realignment -->
383
384 <param name="O" type="boolean" truevalue="-O" falsevalue="" checked="False" label="Turn off left-alignment of indels?" help="-O --dont-left-align-indels; default=False (do left align). " />
385
386 <!-- input filters -->
387
388 <conditional name="input_filters">
389 <param name="input_filters_selector" type="boolean" truevalue="set" falsevalue="do_not_set" label="Set input filters?" help="Sets -4, -m, -q, -R, -Y, -Q, -U, -z, -&#36;, -e, -0, -F, -C, -3, -G, and -&#33; options " />
390 <when value="set">
391 <param name="use_duplicate_reads" type="boolean" truevalue="--use-duplicate-reads" falsevalue="" checked="False" label="Include duplicate-marked alignments in the analysis." help="-4 --use-duplicate-reads; default=False (exclude duplicates marked as such in alignments)." />
392 <param name="m" type="integer" value="1" label="Exclude alignments from analysis if they have a mapping quality less than" help="-m --min-mapping-quality; default=1" />
393 <param name="q" type="integer" value="0" label="Exclude alleles from analysis if their supporting base quality less than" help="-q --min-base-quality; default=0" />
394 <param name="R" type="integer" value="0" label="Consider any allele in which the sum of qualities of supporting observations is at least" help="-R --min-supporting-allele-qsum; default=0" />
395 <param name="Y" type="integer" value="0" label="Consider any allele in which and the sum of mapping qualities of supporting reads is at least" help="-Y --min-supporting-mapping-qsum; default=0" />
396 <conditional name="mismatch_filters">
397 <param name="mismatch_filters_selector" type="boolean" truevalue="set" falsevalue="do_not_set" label="Perform mismatch filtering?" help="Sets -Q, -U, -z, and &#36; options" />
398 <when value="set">
399 <param name="Q" type="integer" value="10" label="Count mismatches toward -U (option below) if the base quality of the mismatch is >=" help="-Q --mismatch-base-quality-threshold; default=10" />
400 <param name="U" type="integer" value="1000" optional="True" label="Exclude reads with more than N mismatches where each mismatch has base quality >= Q (option above)" help="-U --read-mismatch-limit; default=~unbound" />
401 <param name="z" type="float" value="1.0" min="0.0" max="1.0" label="Exclude reads with more than N [0,1] fraction of mismatches where each mismatch has base quality >= Q (second option above)" help="-z --read-max-mismatch-fraction; default=1.0" />
402 <param name="read_snp_limit" type="integer" value="1000" label="Exclude reads with more than N base mismatches, ignoring gaps with quality >= Q (third option abobe)" help="-$amp; --read-snp-limit N " />
403 </when>
404 <when value="do_not_set">
405 <!-- do nothing -->
406 </when>
407 </conditional>
408 <param name="e" type="integer" value="1000" label="Exclude reads with more than this number of separate gaps" help="-e --read-snp-limit; default=~unbounded" />
409 <param name="standard_filters" type="boolean" truevalue="-0" falsevalue="" checked="False" label="Use stringent input base and mapping quality filters" help="-0 --standard-filters; default=False. Equivalent to -m 30 -q 20 -R 0 -S 0" />
410 <param name="F" type="float" value="0.2" label="Require at least this fraction of observations supporting an alternate allele within a single individual in the in order to evaluate the position" help="-F --min-alternate-fraction; default=0.2" />
411 <param name="C" type="integer" value="2" label="Require at least this count of observations supporting an alternate allele within a single individual in order to evaluate the position" help="-C --min-alternate-count; default=2" />
412 <param name="min_alternate_qsum" type="integer" value="0" label="Require at least this sum of quality of observations supporting an alternate allele within a single individual in order to evaluate the position" help="-3 --min-alternate-qsum; default=0" />
413 <param name="G" type="integer" value="1" label="Require at least this count of observations supporting an alternate allele within the total population in order to use the allele in analysis" help="-G --min-alternate-total N; default=1" />
414 <param name="min_coverage" type="integer" value="0" label="Require at least this coverage to process a site" help="-! --min-coverage; default=0 " />
415 </when>
416 <when value="do_not_set">
417 <!-- do nothing -->
418 </when>
419 </conditional>
420
421 <!-- population and mappability priors -->
422
423 <conditional name="population_mappability_priors">
424 <param name="population_mappability_priors_selector" type="boolean" truevalue="set" falsevalue="do_not_set" label="Set population and mappability priors?" help="Sets -k, -w, -V, and -a options " />
425 <when value="set">
426 <param name="k" type="boolean" truevalue="-k" falsevalue="" checked="False" label="No population priors" help="-k --no-population-priors; default=False. Equivalent to --pooled-discrete --hwe-priors-off and removal of Ewens Sampling Formula component of priors." />
427 <param name="w" type="boolean" truevalue="-w" falsevalue="" checked="False" label="Disable estimation of the probability of the combination arising under HWE given the allele frequency as estimated by observation frequency" help="-w --hwe-priors-off; default=False" />
428 <param name="V" type="boolean" truevalue="-V" falsevalue="" checked="False" label="Disable incorporation of prior expectations about observations" help="-V --binomial-obs-priors-off; default=False. Uses read placement probability, strand balance probability, and read position (5&#39;'-3&#39;') probability." />
429 <param name="a" type="boolean" truevalue="-a" falsevalue="" checked="False" label="isable use of aggregate probability of observation balance between alleles as a component of the priors" help="-a --allele-balance-priors-off; default=False " />
430 </when>
431 <when value="do_not_set">
432 <!-- do nothing -->
433 </when>
434 </conditional>
435
436 <!-- genotype likelihoods -->
437
438 <conditional name="genotype_likelihoods">
439 <param name="genotype_likelihoods_selector" type="boolean" truevalue="set" falsevalue="do_not_set" label="Tweak genotype likelihoods?" help="Sets --base-quality-cap, --experimental-gls, and --prob-contamination options. " />
440 <when value="set">
441 <param name="base_quality_cap" type="integer" value="0" label="Limit estimated observation quality by capping base quality at" help="--base-quality-cap" />
442 <param name="experimental_gls" type="boolean" truevalue="--experimental-gls" falsevalue="" checked="False" label="Generate genotype likelihoods using 'effective base depth' metric qual = 1-BaseQual * 1-MapQual" help="--experimental-gls; Incorporate partial observations. This is the default when contamination estimates are provided. Optimized for diploid samples." />
443 <param name="prob_contamination" type="float" value="10e-9" label="An estimate of contamination to use for all samples. " help="--prob-contamination; default=10e-9." />
444 </when>
445 <when value="do_not_set">
446 <!-- do nothing -->
447 </when>
448 </conditional>
449
450 <!-- algorithmic features -->
451
452 <conditional name="algorithmic_features">
453 <param name="algorithmic_features_selector" type="boolean" truevalue="set" falsevalue="do_not_set" label="Tweak algorithmic features?" help="Sets --report-genotypes-likelihood-max, -B, --genotyping-max-banddepth, -W, -N, S, -j, -H, -D, -= options " />
454 <when value="set">
455 <param name="report_genotype_likelihood_max" type="boolean" truevalue="--report-genotype-likelihood-max" falsevalue="" checked="False" label="Report genotypes using the maximum-likelihood estimate provided from genotype likelihoods." help="--report-genotype-likelihood-max; default=False" />
456 <param name="B" type="integer" value="1000" label="Iterate no more than N times during genotyping step" help="-B --genotyping-max-iterations; default=1000." />
457 <param name="genotyping_max_banddepth" type="integer" value="6" label="Integrate no deeper than the Nth best genotype by likelihood when genotyping" help="--genotyping-max-banddepth; default=6" />
458 <param name="W" type="text" value="1,3" label="Integrate all genotype combinations in our posterior space which include no more than N (1) samples with their Mth (3) best data likelihood" help="-W --posterior-integration-limits; default=1,3" />
459 <param name="N" type="boolean" truevalue="--exclude-unobserved-genotypes" falsevalue="" checked="False" label="Skip sample genotypings for which the sample has no supporting reads" help="-N --exclude-unobserved-genotypes; default=False" />
460 <conditional name="genotype_variant_threshold">
461 <param name="genotype_variant_threshold_selector" type="boolean" truevalue="set" falsevalue="do_not_set" label="Do you want to to limit posterior integration" help="-S --genotype-variant-threshold" />
462 <when value="do_not_set">
463 <!-- do nothing -->
464 </when>
465 <when value="set">
466 <param name="S" value="" type="integer" label="Limit posterior integration to samples where the second-best genotype likelihood is no more than log(N) from the highest genotype likelihood for the sample." help="-S --genotype-variant-threshold; default=~unbounded" />
467 </when>
468 </conditional>
469 <param name="j" type="boolean" truevalue="-j" falsevalue="" checked="False" label="Use mapping quality of alleles when calculating data likelihoods" help="-j --use-mapping-quality; default=False" />
470 <param name="H" type="boolean" truevalue="-H" falsevalue="" checked="False" label="Use a weighted sum of base qualities around an indel, scaled by the distance from the indel" help="-H --harmonic-indel-quality; default=use a minimum Base Quality in flanking sequence." />
471 <param name="D" type="float" value="0.9" label="Incorporate non-independence of reads by scaling successive observations by this factor during data likelihood calculations" help="-D --read-dependence-factor; default=0.9." />
472 <param name="genotype_qualities" type="boolean" truevalue="--genotype-qualities" falsevalue="" checked="False" label="Calculate the marginal probability of genotypes and report as GQ in each sample field in the VCF output" help="-= --genotype-qualities; default=False " />
473 </when>
474 <when value="do_not_set">
475 <!-- do nothing -->
476 </when>
477 </conditional>
478 </when>
479 <when value="simple">
480 <!-- do nothing -->
481 </when>
482 <when value="simple_w_filters">
483 <!-- add standard-filters to command line -->
484 <param name="min_coverage" type="integer" value="0" label="Require at least this coverage to process a site" help="-! --min-coverage; default=0 " />
485 </when>
486 <when value="naive">
487 <!-- do nothing build command line using haplotype-length 0 min-alternate-count 1 min-alternate-fraction 0 pooled-continuous report-monomorphic -->
488 </when>
489 <when value="naive_w_filters">
490 <!-- do nothing build command line using haplotype-length 0 min-alternate-count 1 min-alternate-fraction 0 pooled-continuous report-monomorphic standard-filters-->
491 <param name="min_coverage" type="integer" value="0" label="Require at least this coverage to process a site" help="-! --min-coverage; default=0 " />
492 </when>
493 </conditional>
494
495 </inputs>
496
497 <outputs>
498 <data format="vcf" name="output_vcf" label="${tool.name} on ${on_string} (variants)" />
499 <data format="bed" name="output_failed_alleles_bed" label="${tool.name} on ${on_string} (failed alleles)">
500 <filter>( options_type['options_type_selector'] == 'cline' or options_type['options_type_selector'] == 'full' ) and options_type['optional_inputs']['optional_inputs_selector'] is True and options_type['optional_inputs']['output_failed_alleles_option'] is True</filter>
501 </data>
502 <data format="txt" name="output_trace" label="${tool.name} on ${on_string} (trace)">
503 <filter>( options_type['options_type_selector'] == 'cline' or options_type['options_type_selector'] == 'full' ) and options_type['optional_inputs']['optional_inputs_selector'] is True and options_type['optional_inputs']['output_trace_option'] is True</filter>
504 </data>
505 </outputs>
506 <tests>
507 <test>
508 <param name="reference_source_selector" value="history" />
509 <param name="ref_file" ftype="fasta" value="freebayes-phix174.fasta"/>
510 <param name="input_bam" ftype="bam" value="freebayes-phix174.bam"/>
511 <param name="options_type_selector" value="simple"/>
512 <output name="output_vcf" file="freebayes-phix174-test1.vcf" compare="contains"/>
513 </test>
514 <test>
515 <param name="reference_source_selector" value="history" />
516 <param name="ref_file" ftype="fasta" value="freebayes-phix174.fasta"/>
517 <param name="input_bam" ftype="bam" value="freebayes-phix174.bam"/>
518 <param name="options_type_selector" value="naive_w_filters"/>
519 <param name="min_coverage" value="14"/>
520 <output name="output_vcf" file="freebayes-phix174-test2.vcf" compare="contains"/>
521 </test>
522 </tests>
523 <stdio>
524 <exit_code range="1:" />
525 </stdio>
526 <help>
527 **What it does** 666 **What it does**
528 667
529 FreeBayes is a Bayesian genetic variant detector designed to find small polymorphisms, specifically SNPs (single-nucleotide polymorphisms), indels (insertions and deletions), MNPs (multi-nucleotide polymorphisms), and complex events (composite insertion and substitution events) smaller than the length of a short-read sequencing alignment. 668 FreeBayes is a Bayesian genetic variant detector designed to find small polymorphisms, specifically SNPs (single-nucleotide polymorphisms), indels (insertions and deletions), MNPs (multi-nucleotide polymorphisms), and complex events (composite insertion and substitution events) smaller than the length of a short-read sequencing alignment.
530 669
531 See https://github.com/ekg/freebayes for details on FreeBayes. 670 See https://github.com/ekg/freebayes for details on FreeBayes.
532
533 This Galaxy instance of FreeBayes corresponds to release 0.9.20
534 671
535 ------ 672 ------
536 673
537 **Description** 674 **Description**
538 675
811 **Citation** 948 **Citation**
812 949
813 For the underlying tool, please cite `Erik Garrison and Gabor Marth. Haplotype-based variant detection from short-read sequencing &lt;http://arxiv.org/abs/1207.3907&gt;`_. 950 For the underlying tool, please cite `Erik Garrison and Gabor Marth. Haplotype-based variant detection from short-read sequencing &lt;http://arxiv.org/abs/1207.3907&gt;`_.
814 951
815 The initial version of the wrapper was produced by Dan Blankenberg and upgraded by Anton Nekrutenko. 952 The initial version of the wrapper was produced by Dan Blankenberg and upgraded by Anton Nekrutenko.
816 953 TNG was developed by Bjoern Gruening
817 </help> 954
818 955 </help>
819 <citations> 956 <citations>
820 <citation type="bibtex">@misc{1207.3907, 957 <citation type="bibtex">@misc{1207.3907,
821 Author = {Erik Garrison}, 958 Author = {Erik Garrison},
822 Title = {Haplotype-based variant detection from short-read sequencing}, 959 Title = {Haplotype-based variant detection from short-read sequencing},
823 Year = {2012}, 960 Year = {2012},
824 Eprint = {arXiv:1207.3907}, 961 Eprint = {arXiv:1207.3907},
825 url = {http://arxiv.org/abs/1207.3907}, 962 url = {http://arxiv.org/abs/1207.3907},
826 }</citation> 963 }</citation>
827 </citations> 964 </citations>
828 </tool> 965 </tool>