comparison freebayes.xml @ 30:ef2c525bd8cd draft

"planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/freebayes commit 24f33bda62a7b6771ad42a39fe8c683e09f6d8b8"
author iuc
date Wed, 06 Nov 2019 17:02:57 -0500
parents 156b60c1530f
children 57def2d7c093
comparison
equal deleted inserted replaced
29:156b60c1530f 30:ef2c525bd8cd
1 <tool id="freebayes" name="FreeBayes" version="@DEPENDENCY_VERSION@-0"> 1 <tool id="freebayes" name="FreeBayes" version="@DEPENDENCY_VERSION@">
2 <description>bayesian genetic variant detector</description> 2 <description>bayesian genetic variant detector</description>
3 <macros> 3 <macros>
4 <import>macros.xml</import> 4 <import>macros.xml</import>
5 </macros> 5 </macros>
6 <expand macro="requirements"> 6 <expand macro="requirements">
75 --fasta-reference '${reference_fasta_filename}' 75 --fasta-reference '${reference_fasta_filename}'
76 76
77 ## Outputs 77 ## Outputs
78 --vcf './vcf_output/part_\$i.vcf' 78 --vcf './vcf_output/part_\$i.vcf'
79 79
80 ## Coverage
81 #if str($coverage_options.coverage_options_selector) == "set":
82 @COVERAGE@
83 #end if
84
80 ##advanced options 85 ##advanced options
81 #if str( $options_type.options_type_selector ) == "simple": 86 #if str( $options_type.options_type_selector ) == "simple":
82 #pass 87 #pass
83 #elif str( $options_type.options_type_selector ) == "simple_w_filters": 88 #elif str( $options_type.options_type_selector ) == "simple_w_filters":
84 --standard-filters 89 --standard-filters
85 --min-coverage ${options_type.min_coverage}
86 #elif str( $options_type.options_type_selector ) == "naive": 90 #elif str( $options_type.options_type_selector ) == "naive":
87 --haplotype-length 0 91 --haplotype-length 0
88 --min-alternate-count 1 92 --min-alternate-count 1
89 --min-alternate-fraction 0 93 --min-alternate-fraction 0.05
90 --pooled-continuous 94 --pooled-continuous
91 --report-monomorphic 95 --report-monomorphic
92 #elif str( $options_type.options_type_selector ) == "naive_w_filters": 96 #elif str( $options_type.options_type_selector ) == "naive_w_filters":
93 --haplotype-length 0 97 --haplotype-length 0
94 --min-alternate-count 1 98 --min-alternate-count 1
95 --min-alternate-fraction 0 99 --min-alternate-fraction 0.05
96 --pooled-continuous 100 --pooled-continuous
97 --report-monomorphic 101 --report-monomorphic
98 --standard-filters 102 --standard-filters
99 --min-coverage ${options_type.min_coverage}
100 #elif str( $options_type.options_type_selector ) == "full": 103 #elif str( $options_type.options_type_selector ) == "full":
101 #if str( $options_type.optional_inputs.optional_inputs_selector ) == 'set': 104 #if str( $options_type.optional_inputs.optional_inputs_selector ) == 'set':
102 ${options_type.optional_inputs.report_monomorphic} 105 ${options_type.optional_inputs.report_monomorphic}
103 106
104 #if $options_type.optional_inputs.output_trace_option: 107 #if $options_type.optional_inputs.output_trace_option:
187 -z ${options_type.input_filters.mismatch_filters.z} 190 -z ${options_type.input_filters.mismatch_filters.z}
188 191
189 --read-snp-limit ${options_type.input_filters.mismatch_filters.read_snp_limit} 192 --read-snp-limit ${options_type.input_filters.mismatch_filters.read_snp_limit}
190 #end if 193 #end if
191 194
192 --min-coverage ${options_type.input_filters.min_coverage}
193 --min-alternate-qsum ${options_type.input_filters.min_alternate_qsum} 195 --min-alternate-qsum ${options_type.input_filters.min_alternate_qsum}
194 #end if 196 #end if
195 197
196 ## POPULATION AND MAPPABILITY PRIORS 198 ## POPULATION AND MAPPABILITY PRIORS
197 #if str( $options_type.population_mappability_priors.population_mappability_priors_selector ) == "set": 199 #if str( $options_type.population_mappability_priors.population_mappability_priors_selector ) == "set":
303 <param name="region_chromosome" argument="--region" type="text" label="Region Chromosome" value="" /> <!--only once? --> 305 <param name="region_chromosome" argument="--region" type="text" label="Region Chromosome" value="" /> <!--only once? -->
304 <param name="region_start" type="integer" label="Region Start" value="" /> 306 <param name="region_start" type="integer" label="Region Start" value="" />
305 <param name="region_end" type="integer" label="Region End" value="" /> 307 <param name="region_end" type="integer" label="Region End" value="" />
306 </when> 308 </when>
307 </conditional> 309 </conditional>
310 <conditional name="coverage_options">
311 <param name="coverage_options_selector" type="select" label="Read coverage"
312 help="Sets --min-coverage, --limit-coverage, and --skip-coverage">
313 <option value="do_not_set" selected="true">Use defaults</option>
314 <option value="set">Specify coverage options</option>
315 </param>
316 <when value="set">
317 <expand macro="par_min_cov" />
318 </when>
319 <when value="do_not_set" />
320 </conditional>
308 <conditional name="options_type"> 321 <conditional name="options_type">
309 <param name="options_type_selector" type="select" label="Choose parameter selection level" 322 <param name="options_type_selector" type="select" label="Choose parameter selection level"
310 help="Select how much control over the freebayes run you need"> 323 help="Select how much control over the freebayes run you need">
311 <option value="simple" selected="true">1. Simple diploid calling</option> 324 <option value="simple" selected="true">1. Simple diploid calling</option>
312 <option value="simple_w_filters">2. Simple diploid calling with filtering and coverage</option> 325 <option value="simple_w_filters">2. Simple diploid calling with filtering and coverage</option>
313 <option value="naive">3. Frequency-based pooled calling</option> 326 <option value="naive">3. Frequency-based pooled calling</option>
314 <option value="naive_w_filters">4. Frequency-based pooled calling with filtering and coverage</option> 327 <option value="naive_w_filters">4. Frequency-based pooled calling with filtering and coverage</option>
315 <option value="full">5. Full list of options</option> 328 <option value="full">5. Full list of options</option>
316 </param> 329 </param>
317 <when value="full"> 330 <when value="full">
331
318 <conditional name="optional_inputs"> 332 <conditional name="optional_inputs">
319 <param name="optional_inputs_selector" type="select" label="Additional inputs" 333 <param name="optional_inputs_selector" type="select" label="Additional inputs"
320 help="Sets --samples, --populations, --cnv-map, --trace, --failed-alleles, --variant-input, --only-use-input-alleles, --haplotype-basis-alleles, --report-all-haplotype-alleles, --report-monomorphic options, --observation-bias, and --contamination-estimates"> 334 help="Sets --samples, --populations, --cnv-map, --trace, --failed-alleles, --variant-input, --only-use-input-alleles, --haplotype-basis-alleles, --report-all-haplotype-alleles, --report-monomorphic options, --observation-bias, and --contamination-estimates">
321 <option value="do_not_set" selected="true">Do not provide additional inputs</option> 335 <option value="do_not_set" selected="true">Do not provide additional inputs</option>
322 <option value="set">Provide additional inputs</option> 336 <option value="set">Provide additional inputs</option>
437 help="Alleles are ranked by the sum of supporting quality scores. Set to 0 to evaluate all" /> 451 help="Alleles are ranked by the sum of supporting quality scores. Set to 0 to evaluate all" />
438 <param name="haplotype_length" argument="--haplotype-length" type="integer" value="3" 452 <param name="haplotype_length" argument="--haplotype-length" type="integer" value="3"
439 label="Allow haplotype calls with contiguous embedded matches of up to (nucleotides)" /> 453 label="Allow haplotype calls with contiguous embedded matches of up to (nucleotides)" />
440 <param name="min_repeat_length" argument="--min-repeat-size" type="integer" value="5" 454 <param name="min_repeat_length" argument="--min-repeat-size" type="integer" value="5"
441 label="When assembling observations across repeats, require the total repeat length at least this many bp" /> 455 label="When assembling observations across repeats, require the total repeat length at least this many bp" />
442 <param name="min_repeat_entropy" argument="--min-repeat-entropy" type="integer" value="0" 456 <param name="min_repeat_entropy" argument="--min-repeat-entropy" type="integer" value="1"
443 label="To detect interrupted repeats, build across sequence until it has entropy > (bits per bp)" /> 457 label="To detect interrupted repeats, build across sequence until it has entropy > (bits per bp)" />
444 <param name="no_partial_observations" argument="--no-partial-observations" type="boolean" truevalue="--no-partial-observations" falsevalue="" checked="false" 458 <param name="no_partial_observations" argument="--no-partial-observations" type="boolean" truevalue="--no-partial-observations" falsevalue="" checked="false"
445 label="Exclude observations which do not fully span the dynamically-determined detection window" 459 label="Exclude observations which do not fully span the dynamically-determined detection window"
446 help="By default, FreeBayes uses all observations, dividing partial support across matching haplotypes when generating haplotypes" /> 460 help="By default, FreeBayes uses all observations, dividing partial support across matching haplotypes when generating haplotypes" />
447 </when> 461 </when>
494 label="Exclude reads with more than this number of separate gaps" 508 label="Exclude reads with more than this number of separate gaps"
495 help="default=~unbounded" /> 509 help="default=~unbounded" />
496 <param name="standard_filters" argument="--standard-filters" type="boolean" truevalue="-0" falsevalue="" checked="false" 510 <param name="standard_filters" argument="--standard-filters" type="boolean" truevalue="-0" falsevalue="" checked="false"
497 label="Use stringent input base and mapping quality filters" 511 label="Use stringent input base and mapping quality filters"
498 help="Equivalent to -m 30 -q 20 -R 0 -S 0" /> 512 help="Equivalent to -m 30 -q 20 -R 0 -S 0" />
499 <param name="F" argument="--min-alternate-fraction" type="float" value="0.2" 513 <param name="F" argument="--min-alternate-fraction" type="float" value="0.05"
500 label="Require at least this fraction of observations supporting an alternate allele within a single individual in the in order to evaluate the position" /> 514 label="Require at least this fraction of observations supporting an alternate allele within a single individual in the in order to evaluate the position" />
501 <param name="C" argument="--min-alternate-count" type="integer" value="2" 515 <param name="C" argument="--min-alternate-count" type="integer" value="2"
502 label="Require at least this count of observations supporting an alternate allele within a single individual in order to evaluate the position" /> 516 label="Require at least this count of observations supporting an alternate allele within a single individual in order to evaluate the position" />
503 <param name="min_alternate_qsum" argument="--min-alternate-qsum" type="integer" value="0" 517 <param name="min_alternate_qsum" argument="--min-alternate-qsum" type="integer" value="0"
504 label="Require at least this sum of quality of observations supporting an alternate allele within a single individual in order to evaluate the position" /> 518 label="Require at least this sum of quality of observations supporting an alternate allele within a single individual in order to evaluate the position" />
505 <param name="G" argument="--min-alternate-total" type="integer" value="1" 519 <param name="G" argument="--min-alternate-total" type="integer" value="1"
506 label="Require at least this count of observations supporting an alternate allele within the total population in order to use the allele in analysis" /> 520 label="Require at least this count of observations supporting an alternate allele within the total population in order to use the allele in analysis" />
507 <expand macro="par_min_cov" />
508 </when> 521 </when>
509 <when value="do_not_set" /> 522 <when value="do_not_set" />
510 </conditional> 523 </conditional>
511 524
512 <!-- population and mappability priors --> 525 <!-- population and mappability priors -->
583 </when> 596 </when>
584 <when value="do_not_set" /> 597 <when value="do_not_set" />
585 </conditional> 598 </conditional>
586 </when> 599 </when>
587 <when value="simple" /> 600 <when value="simple" />
588 <when value="simple_w_filters"> 601 <when value="simple_w_filters" />
589 <!-- add standard-filters to command line --> 602 <when value="naive" />
590 <expand macro="par_min_cov" /> 603 <when value="naive_w_filters" />
591 </when>
592 <when value="naive">
593 <!-- build command line using haplotype-length 0 min-alternate-count 1 min-alternate-fraction 0 pooled-continuous report-monomorphic -->
594 </when>
595 <when value="naive_w_filters">
596 <!-- build command line using haplotype-length 0 min-alternate-count 1 min-alternate-fraction 0 pooled-continuous report-monomorphic standard-filters-->
597 <expand macro="par_min_cov" />
598 </when>
599 </conditional> 604 </conditional>
600 </inputs> 605 </inputs>
601 <outputs> 606 <outputs>
602 <data format="vcf" name="output_vcf" label="${tool.name} on ${on_string} (variants)" /> 607 <data format="vcf" name="output_vcf" label="${tool.name} on ${on_string} (variants)" />
603 <data format="bed" name="output_failed_alleles_bed" label="${tool.name} on ${on_string} (failed alleles)"> 608 <data format="bed" name="output_failed_alleles_bed" label="${tool.name} on ${on_string} (failed alleles)">
620 <param name="reference_source_selector" value="history" /> 625 <param name="reference_source_selector" value="history" />
621 <param name="processmode" value="individual" /> 626 <param name="processmode" value="individual" />
622 <param name="ref_file" ftype="fasta" value="freebayes-phix174.fasta"/> 627 <param name="ref_file" ftype="fasta" value="freebayes-phix174.fasta"/>
623 <param name="input_bams" ftype="bam" value="freebayes-phix174.bam"/> 628 <param name="input_bams" ftype="bam" value="freebayes-phix174.bam"/>
624 <param name="options_type_selector" value="naive_w_filters"/> 629 <param name="options_type_selector" value="naive_w_filters"/>
630 <param name="coverage_options_selector" value="set" />
625 <param name="min_coverage" value="14"/> 631 <param name="min_coverage" value="14"/>
626 <output name="output_vcf" file="freebayes-phix174-test2.vcf" lines_diff="4" /> 632 <output name="output_vcf" file="freebayes-phix174-test2.vcf" lines_diff="4" />
627 </test> 633 </test>
628 <test> 634 <test>
629 <param name="reference_source_selector" value="history" /> 635 <param name="reference_source_selector" value="history" />
630 <param name="processmode" value="individual" /> 636 <param name="processmode" value="individual" />
631 <param name="ref_file" ftype="fasta" value="freebayes-phix174.fasta"/> 637 <param name="ref_file" ftype="fasta" value="freebayes-phix174.fasta"/>
632 <param name="input_bams" ftype="bam" value="freebayes-phix174.bam"/> 638 <param name="input_bams" ftype="bam" value="freebayes-phix174.bam"/>
633 <param name="options_type_selector" value="naive_w_filters"/> 639 <param name="options_type_selector" value="naive_w_filters"/>
640 <param name="coverage_options_selector" value="set" />
634 <param name="min_coverage" value="14"/> 641 <param name="min_coverage" value="14"/>
635 <output name="output_vcf" file="freebayes-phix174-test3.vcf" lines_diff="4" /> 642 <output name="output_vcf" file="freebayes-phix174-test3.vcf" lines_diff="4" />
636 </test> 643 </test>
637 <test> 644 <test>
638 <param name="reference_source_selector" value="history" /> 645 <param name="reference_source_selector" value="history" />
642 <param name="options_type_selector" value="full"/> 649 <param name="options_type_selector" value="full"/>
643 <param name="population_model_selector" value="set"/> 650 <param name="population_model_selector" value="set"/>
644 <param name="P" value="1"/> 651 <param name="P" value="1"/>
645 <output name="output_vcf" file="freebayes-phix174-test4.vcf" lines_diff="4" /> 652 <output name="output_vcf" file="freebayes-phix174-test4.vcf" lines_diff="4" />
646 </test> 653 </test>
654 <test>
655 <param name="reference_source_selector" value="history" />
656 <param name="processmode" value="individual" />
657 <param name="ref_file" ftype="fasta" value="freebayes-hxb2.fasta"/>
658 <param name="input_bams" ftype="bam" value="freebayes-hxb2.bam"/>
659 <param name="options_type_selector" value="simple"/>
660 <param name="coverage_options_selector" value="set" />
661 <param name="min_coverage" value="250" />
662 <output name="output_vcf" file="freebayes-hxb2-test5.vcf" lines_diff="4" />
663 </test>
664 <test>
665 <param name="reference_source_selector" value="history" />
666 <param name="processmode" value="individual" />
667 <param name="ref_file" ftype="fasta" value="freebayes-hxb2.fasta"/>
668 <param name="input_bams" ftype="bam" value="freebayes-hxb2.bam"/>
669 <param name="options_type_selector" value="simple"/>
670 <param name="coverage_options_selector" value="set" />
671 <param name="limit_coverage" value="400" />
672 <output name="output_vcf" file="freebayes-hxb2-test6.vcf" lines_diff="4" />
673 </test>
674 <test>
675 <param name="reference_source_selector" value="history" />
676 <param name="processmode" value="individual" />
677 <param name="ref_file" ftype="fasta" value="freebayes-hxb2.fasta"/>
678 <param name="input_bams" ftype="bam" value="freebayes-hxb2.bam"/>
679 <param name="options_type_selector" value="simple"/>
680 <param name="coverage_options_selector" value="set" />
681 <param name="skip_coverage" value="100" />
682 <output name="output_vcf" file="freebayes-hxb2-test7.vcf" lines_diff="4" />
683 </test>
647 </tests> 684 </tests>
648 <help> 685 <help><![CDATA[
649 **What it does** 686 **What it does**
650 687
651 FreeBayes is a Bayesian genetic variant detector designed to find small polymorphisms, specifically SNPs (single-nucleotide polymorphisms), indels (insertions and deletions), MNPs (multi-nucleotide polymorphisms), and complex events (composite insertion and substitution events) smaller than the length of a short-read sequencing alignment. 688 FreeBayes is a Bayesian genetic variant detector designed to find small polymorphisms, specifically SNPs (single-nucleotide polymorphisms), indels (insertions and deletions), MNPs (multi-nucleotide polymorphisms), and complex events (composite insertion and substitution events) smaller than the length of a short-read sequencing alignment.
652 689
653 See https://github.com/ekg/freebayes for details on FreeBayes. 690 See https://github.com/ekg/freebayes for details on FreeBayes.
678 4. *Frequency-based pooled calling with filtering and coverage*: Same as #3 but adds -0 and --min-coverage like in #2. 715 4. *Frequency-based pooled calling with filtering and coverage*: Same as #3 but adds -0 and --min-coverage like in #2.
679 5. *Complete list of all options*: Gives you full control by exposing all FreeBayes options as Galaxy parameters. 716 5. *Complete list of all options*: Gives you full control by exposing all FreeBayes options as Galaxy parameters.
680 717
681 ------ 718 ------
682 719
720 **Command-line parameters**
721
722 **Input**::
723
724 --bam FILE The file or set of BAM files to be analyzed.
725 --bam-list FILE A file containing a list of BAM files to be analyzed.
726
727 --stdin Read BAM input on stdin.
728 --fasta-reference FILE Use FILE as the reference sequence for analysis.
729 An index file (FILE.fai) will be created if none exists.
730 If neither --targets nor --region are specified, FreeBayes
731 will analyze every position in this reference.
732 --targets FILE Limit analysis to targets listed in the BED-format FILE.
733 --region <chrom>:<start>-<end> Limit analysis to the specified region, 0-base coordinates,
734 end_position not included (same as BED format).
735 Either '-' or '..' maybe used as a separator.
736 --samples FILE Limit analysis to samples listed (one per line) in the FILE.
737 By default FreeBayes will analyze all samples in its input
738 BAM files.
739 --populations FILE Each line of FILE should list a sample and a population which
740 it is part of. The population-based bayesian inference model
741 will then be partitioned on the basis of the populations.
742 --cnv-map FILE Read a copy number map from the BED file FILE, which has
743 either a sample-level ploidy:
744 sample_name copy_number
745 or a region-specific format:
746 seq_name start end sample_name copy_number
747 ... for each region in each sample which does not have the
748 default copy number as set by --ploidy. These fields can be delimited
749 by space or tab.
750
751 **Output**::
752
753 --vcf FILE Output VCF-format results to FILE. (default: stdout)
754 --gvcf Write gVCF output, which indicates coverage in uncalled regions.
755 --gvcf-chunk NUM When writing gVCF output emit a record for every NUM bases.
756 --gvcf-dont-use-chunk When writing the gVCF output emit a record for all bases if
757 set to "true" , will also route an int to --gvcf-chunk
758 similar to --output-mode EMIT_ALL_SITES from GATK
759 --variant-input VCF Use variants reported in VCF file as input to the algorithm.
760 Variants in this file will included in the output even if
761 there is not enough support in the data to pass input filters.
762 --only-use-input-alleles Only provide variant calls and genotype likelihoods for sites
763 and alleles which are provided in the VCF input, and provide
764 output in the VCF for all input alleles, not just those which
765 have support in the data.
766 --haplotype-basis-alleles VCF When specified, only variant alleles provided in this input
767 VCF will be used for the construction of complex or haplotype
768 alleles.
769 --report-all-haplotype-alleles At sites where genotypes are made over haplotype alleles,
770 provide information about all alleles in output, not only
771 those which are called.
772 --report-monomorphic Report even loci which appear to be monomorphic, and report all
773 considered alleles, even those which are not in called genotypes.
774 Loci which do not have any potential alternates have '.' for ALT.
775 --pvar N Report sites if the probability that there is a polymorphism
776 at the site is greater than N. default: 0.0. Note that post-
777 filtering is generally recommended over the use of this parameter.
778 --strict-vcf Generate strict VCF format (FORMAT/GQ will be an int)
779
780 **Population model**::
781
782 --theta N The expected mutation rate or pairwise nucleotide diversity
783 among the population under analysis. This serves as the
784 single parameter to the Ewens Sampling Formula prior model
785 default: 0.001
786 --ploidy N Sets the default ploidy for the analysis to N. default: 2
787 --pooled-discrete Assume that samples result from pooled sequencing.
788 Model pooled samples using discrete genotypes across pools.
789 When using this flag, set --ploidy to the number of
790 alleles in each sample or use the --cnv-map to define
791 per-sample ploidy.
792 --pooled-continuous Output all alleles which pass input filters, regardles of
793 genotyping outcome or model.
794
795 **Reference allele**::
796
797 --use-reference-allele This flag includes the reference allele in the analysis as
798 if it is another sample from the same population.
799 --reference-quality MQ,BQ Assign mapping quality of MQ to the reference allele at each
800 site and base quality of BQ. default: 100,60
801
802 **Allele scope**::
803
804 --use-best-n-alleles N Evaluate only the best N SNP alleles, ranked by sum of
805 supporting quality scores. (Set to 0 to use all; default: all)
806 --max-complex-gap
807 --haplotype-length N Allow haplotype calls with contiguous embedded matches of up
808 to this length. Set N=-1 to disable clumping. (default: 3)
809 --min-repeat-size When assembling observations across repeats, require the total repeat
810 length at least this many bp. (default: 5)
811 --min-repeat-entropy N To detect interrupted repeats, build across sequence until it has
812 entropy > N bits per bp. Set to 0 to turn off. (default: 1)
813 --no-partial-observations Exclude observations which do not fully span the dynamically-determined
814 detection window. (default, use all observations, dividing partial
815 support across matching haplotypes when generating haplotypes.)
816
817 **Indel realignment**::
818
819 --dont-left-align-indels Turn off left-alignment of indels, which is enabled by default.
820
821 **Input filters**::
822
823 --use-duplicate-reads Include duplicate-marked alignments in the analysis.
824 default: exclude duplicates marked as such in alignments
825 --min-mapping-quality Q Exclude alignments from analysis if they have a mapping
826 quality less than Q. default: 1
827 --min-base-quality Q Exclude alleles from analysis if their supporting base
828 quality is less than Q. default: 0
829 --min-supporting-allele-qsum Q Consider any allele in which the sum of qualities of supporting
830 observations is at least Q. default: 0
831 --min-supporting-mapping-qsum Q Consider any allele in which and the sum of mapping qualities of
832 supporting reads is at least Q. default: 0
833 --mismatch-base-quality-threshold Q Count mismatches toward --read-mismatch-limit if the base
834 quality of the mismatch is >= Q. default: 10
835 --read-mismatch-limit N Exclude reads with more than N mismatches where each mismatch
836 has base quality >= mismatch-base-quality-threshold.
837 default: ~unbounded
838 --read-max-mismatch-fraction N Exclude reads with more than N [0,1] fraction of mismatches where
839 each mismatch has base quality >= mismatch-base-quality-threshold
840 default: 1.0
841 --read-snp-limit N Exclude reads with more than N base mismatches, ignoring gaps
842 with quality >= mismatch-base-quality-threshold.
843 default: ~unbounded
844 --read-indel-limit N Exclude reads with more than N separate gaps.
845 default: ~unbounded
846 --standard-filters Use stringent input base and mapping quality filters
847 Equivalent to -m 30 -q 20 -R 0 -S 0
848 --min-alternate-fraction N Require at least this fraction of observations supporting
849 an alternate allele within a single individual in the
850 in order to evaluate the position. default: 0.05
851 --min-alternate-count N Require at least this count of observations supporting
852 an alternate allele within a single individual in order
853 to evaluate the position. default: 2
854 --min-alternate-qsum N Require at least this sum of quality of observations supporting
855 an alternate allele within a single individual in order
856 to evaluate the position. default: 0
857 --min-alternate-total N Require at least this count of observations supporting
858 an alternate allele within the total population in order
859 to use the allele in analysis. default: 1
860 --min-coverage N Require at least this coverage to process a site. default: 0
861 --limit-coverage N Downsample per-sample coverage to this level if greater than this coverage.
862 default: no limit
863 --skip-coverage N Skip processing of alignments overlapping positions with coverage >N.
864 This filters sites above this coverage, but will also reduce data nearby.
865 default: no limit
866
867 **Population priors**::
868
869 --no-population-priors Equivalent to --pooled-discrete --hwe-priors-off and removal of
870 Ewens Sampling Formula component of priors.
871
872 **Mappability priors**::
873
874 --hwe-priors-off Disable estimation of the probability of the combination
875 arising under HWE given the allele frequency as estimated
876 by observation frequency.
877 --binomial-obs-priors-off Disable incorporation of prior expectations about observations.
878 Uses read placement probability, strand balance probability,
879 and read position (5'-3') probability.
880 --allele-balance-priors-off Disable use of aggregate probability of observation balance between alleles
881 as a component of the priors.
882
883 **Genotype likelihoods**::
884
885 --observation-bias FILE Read length-dependent allele observation biases from FILE.
886 The format is [length] [alignment efficiency relative to reference]
887 where the efficiency is 1 if there is no relative observation bias.
888 --base-quality-cap Q Limit estimated observation quality by capping base quality at Q.
889 --prob-contamination F An estimate of contamination to use for all samples. default: 10e-9
890 --legacy-gls Use legacy (polybayes equivalent) genotype likelihood calculations
891 --contamination-estimates FILE A file containing per-sample estimates of contamination, such as
892 those generated by VerifyBamID. The format should be:
893 sample p(read=R|genotype=AR) p(read=A|genotype=AA)
894 Sample '*' can be used to set default contamination estimates.
895
896 **Algorithmic features**::
897
898 --report-genotype-likelihood-max Report genotypes using the maximum-likelihood estimate provided
899 from genotype likelihoods.
900 --genotyping-max-iterations N Iterate no more than N times during genotyping step. default: 1000.
901 --genotyping-max-banddepth N Integrate no deeper than the Nth best genotype by likelihood when
902 genotyping. default: 6.
903 --posterior-integration-limits N,M Integrate all genotype combinations in our posterior space
904 which include no more than N samples with their Mth best
905 data likelihood. default: 1,3.
906 --exclude-unobserved-genotypes Skip sample genotypings for which the sample has no supporting reads.
907 --genotype-variant-threshold N Limit posterior integration to samples where the second-best
908 genotype likelihood is no more than log(N) from the highest
909 genotype likelihood for the sample. default: ~unbounded
910 --use-mapping-quality Use mapping quality of alleles when calculating data likelihoods.
911 --harmonic-indel-quality Use a weighted sum of base qualities around an indel, scaled by the
912 distance from the indel. By default use a minimum BQ in flanking sequence.
913 --read-dependence-factor N Incorporate non-independence of reads by scaling successive
914 observations by this factor during data likelihood
915 calculations. default: 0.9
916 --genotype-qualities Calculate the marginal probability of genotypes and report as GQ in
917 each sample field in the VCF output.
918
919 ------
920
683 **Acknowledgments** 921 **Acknowledgments**
684 922
685 The initial version of the wrapper was produced by Dan Blankenberg and upgraded by Anton Nekrutenko. 923 The initial version of the wrapper was produced by Dan Blankenberg and upgraded by Anton Nekrutenko.
686 TNG was developed by Bjoern Gruening. 924 TNG was developed by Bjoern Gruening.
925 ]]>
687 </help> 926 </help>
688 <expand macro="citations"> 927 <expand macro="citations">
689 <citation type="bibtex"> 928 <citation type="bibtex">
690 @article{Tange2011a, 929 @article{Tange2011a,
691 title = {GNU Parallel - The Command-Line Power Tool}, 930 title = {GNU Parallel - The Command-Line Power Tool},