Mercurial > repos > devteam > freebayes
comparison freebayes.xml @ 30:ef2c525bd8cd draft
"planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/freebayes commit 24f33bda62a7b6771ad42a39fe8c683e09f6d8b8"
author | iuc |
---|---|
date | Wed, 06 Nov 2019 17:02:57 -0500 |
parents | 156b60c1530f |
children | 57def2d7c093 |
comparison
equal
deleted
inserted
replaced
29:156b60c1530f | 30:ef2c525bd8cd |
---|---|
1 <tool id="freebayes" name="FreeBayes" version="@DEPENDENCY_VERSION@-0"> | 1 <tool id="freebayes" name="FreeBayes" version="@DEPENDENCY_VERSION@"> |
2 <description>bayesian genetic variant detector</description> | 2 <description>bayesian genetic variant detector</description> |
3 <macros> | 3 <macros> |
4 <import>macros.xml</import> | 4 <import>macros.xml</import> |
5 </macros> | 5 </macros> |
6 <expand macro="requirements"> | 6 <expand macro="requirements"> |
75 --fasta-reference '${reference_fasta_filename}' | 75 --fasta-reference '${reference_fasta_filename}' |
76 | 76 |
77 ## Outputs | 77 ## Outputs |
78 --vcf './vcf_output/part_\$i.vcf' | 78 --vcf './vcf_output/part_\$i.vcf' |
79 | 79 |
80 ## Coverage | |
81 #if str($coverage_options.coverage_options_selector) == "set": | |
82 @COVERAGE@ | |
83 #end if | |
84 | |
80 ##advanced options | 85 ##advanced options |
81 #if str( $options_type.options_type_selector ) == "simple": | 86 #if str( $options_type.options_type_selector ) == "simple": |
82 #pass | 87 #pass |
83 #elif str( $options_type.options_type_selector ) == "simple_w_filters": | 88 #elif str( $options_type.options_type_selector ) == "simple_w_filters": |
84 --standard-filters | 89 --standard-filters |
85 --min-coverage ${options_type.min_coverage} | |
86 #elif str( $options_type.options_type_selector ) == "naive": | 90 #elif str( $options_type.options_type_selector ) == "naive": |
87 --haplotype-length 0 | 91 --haplotype-length 0 |
88 --min-alternate-count 1 | 92 --min-alternate-count 1 |
89 --min-alternate-fraction 0 | 93 --min-alternate-fraction 0.05 |
90 --pooled-continuous | 94 --pooled-continuous |
91 --report-monomorphic | 95 --report-monomorphic |
92 #elif str( $options_type.options_type_selector ) == "naive_w_filters": | 96 #elif str( $options_type.options_type_selector ) == "naive_w_filters": |
93 --haplotype-length 0 | 97 --haplotype-length 0 |
94 --min-alternate-count 1 | 98 --min-alternate-count 1 |
95 --min-alternate-fraction 0 | 99 --min-alternate-fraction 0.05 |
96 --pooled-continuous | 100 --pooled-continuous |
97 --report-monomorphic | 101 --report-monomorphic |
98 --standard-filters | 102 --standard-filters |
99 --min-coverage ${options_type.min_coverage} | |
100 #elif str( $options_type.options_type_selector ) == "full": | 103 #elif str( $options_type.options_type_selector ) == "full": |
101 #if str( $options_type.optional_inputs.optional_inputs_selector ) == 'set': | 104 #if str( $options_type.optional_inputs.optional_inputs_selector ) == 'set': |
102 ${options_type.optional_inputs.report_monomorphic} | 105 ${options_type.optional_inputs.report_monomorphic} |
103 | 106 |
104 #if $options_type.optional_inputs.output_trace_option: | 107 #if $options_type.optional_inputs.output_trace_option: |
187 -z ${options_type.input_filters.mismatch_filters.z} | 190 -z ${options_type.input_filters.mismatch_filters.z} |
188 | 191 |
189 --read-snp-limit ${options_type.input_filters.mismatch_filters.read_snp_limit} | 192 --read-snp-limit ${options_type.input_filters.mismatch_filters.read_snp_limit} |
190 #end if | 193 #end if |
191 | 194 |
192 --min-coverage ${options_type.input_filters.min_coverage} | |
193 --min-alternate-qsum ${options_type.input_filters.min_alternate_qsum} | 195 --min-alternate-qsum ${options_type.input_filters.min_alternate_qsum} |
194 #end if | 196 #end if |
195 | 197 |
196 ## POPULATION AND MAPPABILITY PRIORS | 198 ## POPULATION AND MAPPABILITY PRIORS |
197 #if str( $options_type.population_mappability_priors.population_mappability_priors_selector ) == "set": | 199 #if str( $options_type.population_mappability_priors.population_mappability_priors_selector ) == "set": |
303 <param name="region_chromosome" argument="--region" type="text" label="Region Chromosome" value="" /> <!--only once? --> | 305 <param name="region_chromosome" argument="--region" type="text" label="Region Chromosome" value="" /> <!--only once? --> |
304 <param name="region_start" type="integer" label="Region Start" value="" /> | 306 <param name="region_start" type="integer" label="Region Start" value="" /> |
305 <param name="region_end" type="integer" label="Region End" value="" /> | 307 <param name="region_end" type="integer" label="Region End" value="" /> |
306 </when> | 308 </when> |
307 </conditional> | 309 </conditional> |
310 <conditional name="coverage_options"> | |
311 <param name="coverage_options_selector" type="select" label="Read coverage" | |
312 help="Sets --min-coverage, --limit-coverage, and --skip-coverage"> | |
313 <option value="do_not_set" selected="true">Use defaults</option> | |
314 <option value="set">Specify coverage options</option> | |
315 </param> | |
316 <when value="set"> | |
317 <expand macro="par_min_cov" /> | |
318 </when> | |
319 <when value="do_not_set" /> | |
320 </conditional> | |
308 <conditional name="options_type"> | 321 <conditional name="options_type"> |
309 <param name="options_type_selector" type="select" label="Choose parameter selection level" | 322 <param name="options_type_selector" type="select" label="Choose parameter selection level" |
310 help="Select how much control over the freebayes run you need"> | 323 help="Select how much control over the freebayes run you need"> |
311 <option value="simple" selected="true">1. Simple diploid calling</option> | 324 <option value="simple" selected="true">1. Simple diploid calling</option> |
312 <option value="simple_w_filters">2. Simple diploid calling with filtering and coverage</option> | 325 <option value="simple_w_filters">2. Simple diploid calling with filtering and coverage</option> |
313 <option value="naive">3. Frequency-based pooled calling</option> | 326 <option value="naive">3. Frequency-based pooled calling</option> |
314 <option value="naive_w_filters">4. Frequency-based pooled calling with filtering and coverage</option> | 327 <option value="naive_w_filters">4. Frequency-based pooled calling with filtering and coverage</option> |
315 <option value="full">5. Full list of options</option> | 328 <option value="full">5. Full list of options</option> |
316 </param> | 329 </param> |
317 <when value="full"> | 330 <when value="full"> |
331 | |
318 <conditional name="optional_inputs"> | 332 <conditional name="optional_inputs"> |
319 <param name="optional_inputs_selector" type="select" label="Additional inputs" | 333 <param name="optional_inputs_selector" type="select" label="Additional inputs" |
320 help="Sets --samples, --populations, --cnv-map, --trace, --failed-alleles, --variant-input, --only-use-input-alleles, --haplotype-basis-alleles, --report-all-haplotype-alleles, --report-monomorphic options, --observation-bias, and --contamination-estimates"> | 334 help="Sets --samples, --populations, --cnv-map, --trace, --failed-alleles, --variant-input, --only-use-input-alleles, --haplotype-basis-alleles, --report-all-haplotype-alleles, --report-monomorphic options, --observation-bias, and --contamination-estimates"> |
321 <option value="do_not_set" selected="true">Do not provide additional inputs</option> | 335 <option value="do_not_set" selected="true">Do not provide additional inputs</option> |
322 <option value="set">Provide additional inputs</option> | 336 <option value="set">Provide additional inputs</option> |
437 help="Alleles are ranked by the sum of supporting quality scores. Set to 0 to evaluate all" /> | 451 help="Alleles are ranked by the sum of supporting quality scores. Set to 0 to evaluate all" /> |
438 <param name="haplotype_length" argument="--haplotype-length" type="integer" value="3" | 452 <param name="haplotype_length" argument="--haplotype-length" type="integer" value="3" |
439 label="Allow haplotype calls with contiguous embedded matches of up to (nucleotides)" /> | 453 label="Allow haplotype calls with contiguous embedded matches of up to (nucleotides)" /> |
440 <param name="min_repeat_length" argument="--min-repeat-size" type="integer" value="5" | 454 <param name="min_repeat_length" argument="--min-repeat-size" type="integer" value="5" |
441 label="When assembling observations across repeats, require the total repeat length at least this many bp" /> | 455 label="When assembling observations across repeats, require the total repeat length at least this many bp" /> |
442 <param name="min_repeat_entropy" argument="--min-repeat-entropy" type="integer" value="0" | 456 <param name="min_repeat_entropy" argument="--min-repeat-entropy" type="integer" value="1" |
443 label="To detect interrupted repeats, build across sequence until it has entropy > (bits per bp)" /> | 457 label="To detect interrupted repeats, build across sequence until it has entropy > (bits per bp)" /> |
444 <param name="no_partial_observations" argument="--no-partial-observations" type="boolean" truevalue="--no-partial-observations" falsevalue="" checked="false" | 458 <param name="no_partial_observations" argument="--no-partial-observations" type="boolean" truevalue="--no-partial-observations" falsevalue="" checked="false" |
445 label="Exclude observations which do not fully span the dynamically-determined detection window" | 459 label="Exclude observations which do not fully span the dynamically-determined detection window" |
446 help="By default, FreeBayes uses all observations, dividing partial support across matching haplotypes when generating haplotypes" /> | 460 help="By default, FreeBayes uses all observations, dividing partial support across matching haplotypes when generating haplotypes" /> |
447 </when> | 461 </when> |
494 label="Exclude reads with more than this number of separate gaps" | 508 label="Exclude reads with more than this number of separate gaps" |
495 help="default=~unbounded" /> | 509 help="default=~unbounded" /> |
496 <param name="standard_filters" argument="--standard-filters" type="boolean" truevalue="-0" falsevalue="" checked="false" | 510 <param name="standard_filters" argument="--standard-filters" type="boolean" truevalue="-0" falsevalue="" checked="false" |
497 label="Use stringent input base and mapping quality filters" | 511 label="Use stringent input base and mapping quality filters" |
498 help="Equivalent to -m 30 -q 20 -R 0 -S 0" /> | 512 help="Equivalent to -m 30 -q 20 -R 0 -S 0" /> |
499 <param name="F" argument="--min-alternate-fraction" type="float" value="0.2" | 513 <param name="F" argument="--min-alternate-fraction" type="float" value="0.05" |
500 label="Require at least this fraction of observations supporting an alternate allele within a single individual in the in order to evaluate the position" /> | 514 label="Require at least this fraction of observations supporting an alternate allele within a single individual in the in order to evaluate the position" /> |
501 <param name="C" argument="--min-alternate-count" type="integer" value="2" | 515 <param name="C" argument="--min-alternate-count" type="integer" value="2" |
502 label="Require at least this count of observations supporting an alternate allele within a single individual in order to evaluate the position" /> | 516 label="Require at least this count of observations supporting an alternate allele within a single individual in order to evaluate the position" /> |
503 <param name="min_alternate_qsum" argument="--min-alternate-qsum" type="integer" value="0" | 517 <param name="min_alternate_qsum" argument="--min-alternate-qsum" type="integer" value="0" |
504 label="Require at least this sum of quality of observations supporting an alternate allele within a single individual in order to evaluate the position" /> | 518 label="Require at least this sum of quality of observations supporting an alternate allele within a single individual in order to evaluate the position" /> |
505 <param name="G" argument="--min-alternate-total" type="integer" value="1" | 519 <param name="G" argument="--min-alternate-total" type="integer" value="1" |
506 label="Require at least this count of observations supporting an alternate allele within the total population in order to use the allele in analysis" /> | 520 label="Require at least this count of observations supporting an alternate allele within the total population in order to use the allele in analysis" /> |
507 <expand macro="par_min_cov" /> | |
508 </when> | 521 </when> |
509 <when value="do_not_set" /> | 522 <when value="do_not_set" /> |
510 </conditional> | 523 </conditional> |
511 | 524 |
512 <!-- population and mappability priors --> | 525 <!-- population and mappability priors --> |
583 </when> | 596 </when> |
584 <when value="do_not_set" /> | 597 <when value="do_not_set" /> |
585 </conditional> | 598 </conditional> |
586 </when> | 599 </when> |
587 <when value="simple" /> | 600 <when value="simple" /> |
588 <when value="simple_w_filters"> | 601 <when value="simple_w_filters" /> |
589 <!-- add standard-filters to command line --> | 602 <when value="naive" /> |
590 <expand macro="par_min_cov" /> | 603 <when value="naive_w_filters" /> |
591 </when> | |
592 <when value="naive"> | |
593 <!-- build command line using haplotype-length 0 min-alternate-count 1 min-alternate-fraction 0 pooled-continuous report-monomorphic --> | |
594 </when> | |
595 <when value="naive_w_filters"> | |
596 <!-- build command line using haplotype-length 0 min-alternate-count 1 min-alternate-fraction 0 pooled-continuous report-monomorphic standard-filters--> | |
597 <expand macro="par_min_cov" /> | |
598 </when> | |
599 </conditional> | 604 </conditional> |
600 </inputs> | 605 </inputs> |
601 <outputs> | 606 <outputs> |
602 <data format="vcf" name="output_vcf" label="${tool.name} on ${on_string} (variants)" /> | 607 <data format="vcf" name="output_vcf" label="${tool.name} on ${on_string} (variants)" /> |
603 <data format="bed" name="output_failed_alleles_bed" label="${tool.name} on ${on_string} (failed alleles)"> | 608 <data format="bed" name="output_failed_alleles_bed" label="${tool.name} on ${on_string} (failed alleles)"> |
620 <param name="reference_source_selector" value="history" /> | 625 <param name="reference_source_selector" value="history" /> |
621 <param name="processmode" value="individual" /> | 626 <param name="processmode" value="individual" /> |
622 <param name="ref_file" ftype="fasta" value="freebayes-phix174.fasta"/> | 627 <param name="ref_file" ftype="fasta" value="freebayes-phix174.fasta"/> |
623 <param name="input_bams" ftype="bam" value="freebayes-phix174.bam"/> | 628 <param name="input_bams" ftype="bam" value="freebayes-phix174.bam"/> |
624 <param name="options_type_selector" value="naive_w_filters"/> | 629 <param name="options_type_selector" value="naive_w_filters"/> |
630 <param name="coverage_options_selector" value="set" /> | |
625 <param name="min_coverage" value="14"/> | 631 <param name="min_coverage" value="14"/> |
626 <output name="output_vcf" file="freebayes-phix174-test2.vcf" lines_diff="4" /> | 632 <output name="output_vcf" file="freebayes-phix174-test2.vcf" lines_diff="4" /> |
627 </test> | 633 </test> |
628 <test> | 634 <test> |
629 <param name="reference_source_selector" value="history" /> | 635 <param name="reference_source_selector" value="history" /> |
630 <param name="processmode" value="individual" /> | 636 <param name="processmode" value="individual" /> |
631 <param name="ref_file" ftype="fasta" value="freebayes-phix174.fasta"/> | 637 <param name="ref_file" ftype="fasta" value="freebayes-phix174.fasta"/> |
632 <param name="input_bams" ftype="bam" value="freebayes-phix174.bam"/> | 638 <param name="input_bams" ftype="bam" value="freebayes-phix174.bam"/> |
633 <param name="options_type_selector" value="naive_w_filters"/> | 639 <param name="options_type_selector" value="naive_w_filters"/> |
640 <param name="coverage_options_selector" value="set" /> | |
634 <param name="min_coverage" value="14"/> | 641 <param name="min_coverage" value="14"/> |
635 <output name="output_vcf" file="freebayes-phix174-test3.vcf" lines_diff="4" /> | 642 <output name="output_vcf" file="freebayes-phix174-test3.vcf" lines_diff="4" /> |
636 </test> | 643 </test> |
637 <test> | 644 <test> |
638 <param name="reference_source_selector" value="history" /> | 645 <param name="reference_source_selector" value="history" /> |
642 <param name="options_type_selector" value="full"/> | 649 <param name="options_type_selector" value="full"/> |
643 <param name="population_model_selector" value="set"/> | 650 <param name="population_model_selector" value="set"/> |
644 <param name="P" value="1"/> | 651 <param name="P" value="1"/> |
645 <output name="output_vcf" file="freebayes-phix174-test4.vcf" lines_diff="4" /> | 652 <output name="output_vcf" file="freebayes-phix174-test4.vcf" lines_diff="4" /> |
646 </test> | 653 </test> |
654 <test> | |
655 <param name="reference_source_selector" value="history" /> | |
656 <param name="processmode" value="individual" /> | |
657 <param name="ref_file" ftype="fasta" value="freebayes-hxb2.fasta"/> | |
658 <param name="input_bams" ftype="bam" value="freebayes-hxb2.bam"/> | |
659 <param name="options_type_selector" value="simple"/> | |
660 <param name="coverage_options_selector" value="set" /> | |
661 <param name="min_coverage" value="250" /> | |
662 <output name="output_vcf" file="freebayes-hxb2-test5.vcf" lines_diff="4" /> | |
663 </test> | |
664 <test> | |
665 <param name="reference_source_selector" value="history" /> | |
666 <param name="processmode" value="individual" /> | |
667 <param name="ref_file" ftype="fasta" value="freebayes-hxb2.fasta"/> | |
668 <param name="input_bams" ftype="bam" value="freebayes-hxb2.bam"/> | |
669 <param name="options_type_selector" value="simple"/> | |
670 <param name="coverage_options_selector" value="set" /> | |
671 <param name="limit_coverage" value="400" /> | |
672 <output name="output_vcf" file="freebayes-hxb2-test6.vcf" lines_diff="4" /> | |
673 </test> | |
674 <test> | |
675 <param name="reference_source_selector" value="history" /> | |
676 <param name="processmode" value="individual" /> | |
677 <param name="ref_file" ftype="fasta" value="freebayes-hxb2.fasta"/> | |
678 <param name="input_bams" ftype="bam" value="freebayes-hxb2.bam"/> | |
679 <param name="options_type_selector" value="simple"/> | |
680 <param name="coverage_options_selector" value="set" /> | |
681 <param name="skip_coverage" value="100" /> | |
682 <output name="output_vcf" file="freebayes-hxb2-test7.vcf" lines_diff="4" /> | |
683 </test> | |
647 </tests> | 684 </tests> |
648 <help> | 685 <help><![CDATA[ |
649 **What it does** | 686 **What it does** |
650 | 687 |
651 FreeBayes is a Bayesian genetic variant detector designed to find small polymorphisms, specifically SNPs (single-nucleotide polymorphisms), indels (insertions and deletions), MNPs (multi-nucleotide polymorphisms), and complex events (composite insertion and substitution events) smaller than the length of a short-read sequencing alignment. | 688 FreeBayes is a Bayesian genetic variant detector designed to find small polymorphisms, specifically SNPs (single-nucleotide polymorphisms), indels (insertions and deletions), MNPs (multi-nucleotide polymorphisms), and complex events (composite insertion and substitution events) smaller than the length of a short-read sequencing alignment. |
652 | 689 |
653 See https://github.com/ekg/freebayes for details on FreeBayes. | 690 See https://github.com/ekg/freebayes for details on FreeBayes. |
678 4. *Frequency-based pooled calling with filtering and coverage*: Same as #3 but adds -0 and --min-coverage like in #2. | 715 4. *Frequency-based pooled calling with filtering and coverage*: Same as #3 but adds -0 and --min-coverage like in #2. |
679 5. *Complete list of all options*: Gives you full control by exposing all FreeBayes options as Galaxy parameters. | 716 5. *Complete list of all options*: Gives you full control by exposing all FreeBayes options as Galaxy parameters. |
680 | 717 |
681 ------ | 718 ------ |
682 | 719 |
720 **Command-line parameters** | |
721 | |
722 **Input**:: | |
723 | |
724 --bam FILE The file or set of BAM files to be analyzed. | |
725 --bam-list FILE A file containing a list of BAM files to be analyzed. | |
726 | |
727 --stdin Read BAM input on stdin. | |
728 --fasta-reference FILE Use FILE as the reference sequence for analysis. | |
729 An index file (FILE.fai) will be created if none exists. | |
730 If neither --targets nor --region are specified, FreeBayes | |
731 will analyze every position in this reference. | |
732 --targets FILE Limit analysis to targets listed in the BED-format FILE. | |
733 --region <chrom>:<start>-<end> Limit analysis to the specified region, 0-base coordinates, | |
734 end_position not included (same as BED format). | |
735 Either '-' or '..' maybe used as a separator. | |
736 --samples FILE Limit analysis to samples listed (one per line) in the FILE. | |
737 By default FreeBayes will analyze all samples in its input | |
738 BAM files. | |
739 --populations FILE Each line of FILE should list a sample and a population which | |
740 it is part of. The population-based bayesian inference model | |
741 will then be partitioned on the basis of the populations. | |
742 --cnv-map FILE Read a copy number map from the BED file FILE, which has | |
743 either a sample-level ploidy: | |
744 sample_name copy_number | |
745 or a region-specific format: | |
746 seq_name start end sample_name copy_number | |
747 ... for each region in each sample which does not have the | |
748 default copy number as set by --ploidy. These fields can be delimited | |
749 by space or tab. | |
750 | |
751 **Output**:: | |
752 | |
753 --vcf FILE Output VCF-format results to FILE. (default: stdout) | |
754 --gvcf Write gVCF output, which indicates coverage in uncalled regions. | |
755 --gvcf-chunk NUM When writing gVCF output emit a record for every NUM bases. | |
756 --gvcf-dont-use-chunk When writing the gVCF output emit a record for all bases if | |
757 set to "true" , will also route an int to --gvcf-chunk | |
758 similar to --output-mode EMIT_ALL_SITES from GATK | |
759 --variant-input VCF Use variants reported in VCF file as input to the algorithm. | |
760 Variants in this file will included in the output even if | |
761 there is not enough support in the data to pass input filters. | |
762 --only-use-input-alleles Only provide variant calls and genotype likelihoods for sites | |
763 and alleles which are provided in the VCF input, and provide | |
764 output in the VCF for all input alleles, not just those which | |
765 have support in the data. | |
766 --haplotype-basis-alleles VCF When specified, only variant alleles provided in this input | |
767 VCF will be used for the construction of complex or haplotype | |
768 alleles. | |
769 --report-all-haplotype-alleles At sites where genotypes are made over haplotype alleles, | |
770 provide information about all alleles in output, not only | |
771 those which are called. | |
772 --report-monomorphic Report even loci which appear to be monomorphic, and report all | |
773 considered alleles, even those which are not in called genotypes. | |
774 Loci which do not have any potential alternates have '.' for ALT. | |
775 --pvar N Report sites if the probability that there is a polymorphism | |
776 at the site is greater than N. default: 0.0. Note that post- | |
777 filtering is generally recommended over the use of this parameter. | |
778 --strict-vcf Generate strict VCF format (FORMAT/GQ will be an int) | |
779 | |
780 **Population model**:: | |
781 | |
782 --theta N The expected mutation rate or pairwise nucleotide diversity | |
783 among the population under analysis. This serves as the | |
784 single parameter to the Ewens Sampling Formula prior model | |
785 default: 0.001 | |
786 --ploidy N Sets the default ploidy for the analysis to N. default: 2 | |
787 --pooled-discrete Assume that samples result from pooled sequencing. | |
788 Model pooled samples using discrete genotypes across pools. | |
789 When using this flag, set --ploidy to the number of | |
790 alleles in each sample or use the --cnv-map to define | |
791 per-sample ploidy. | |
792 --pooled-continuous Output all alleles which pass input filters, regardles of | |
793 genotyping outcome or model. | |
794 | |
795 **Reference allele**:: | |
796 | |
797 --use-reference-allele This flag includes the reference allele in the analysis as | |
798 if it is another sample from the same population. | |
799 --reference-quality MQ,BQ Assign mapping quality of MQ to the reference allele at each | |
800 site and base quality of BQ. default: 100,60 | |
801 | |
802 **Allele scope**:: | |
803 | |
804 --use-best-n-alleles N Evaluate only the best N SNP alleles, ranked by sum of | |
805 supporting quality scores. (Set to 0 to use all; default: all) | |
806 --max-complex-gap | |
807 --haplotype-length N Allow haplotype calls with contiguous embedded matches of up | |
808 to this length. Set N=-1 to disable clumping. (default: 3) | |
809 --min-repeat-size When assembling observations across repeats, require the total repeat | |
810 length at least this many bp. (default: 5) | |
811 --min-repeat-entropy N To detect interrupted repeats, build across sequence until it has | |
812 entropy > N bits per bp. Set to 0 to turn off. (default: 1) | |
813 --no-partial-observations Exclude observations which do not fully span the dynamically-determined | |
814 detection window. (default, use all observations, dividing partial | |
815 support across matching haplotypes when generating haplotypes.) | |
816 | |
817 **Indel realignment**:: | |
818 | |
819 --dont-left-align-indels Turn off left-alignment of indels, which is enabled by default. | |
820 | |
821 **Input filters**:: | |
822 | |
823 --use-duplicate-reads Include duplicate-marked alignments in the analysis. | |
824 default: exclude duplicates marked as such in alignments | |
825 --min-mapping-quality Q Exclude alignments from analysis if they have a mapping | |
826 quality less than Q. default: 1 | |
827 --min-base-quality Q Exclude alleles from analysis if their supporting base | |
828 quality is less than Q. default: 0 | |
829 --min-supporting-allele-qsum Q Consider any allele in which the sum of qualities of supporting | |
830 observations is at least Q. default: 0 | |
831 --min-supporting-mapping-qsum Q Consider any allele in which and the sum of mapping qualities of | |
832 supporting reads is at least Q. default: 0 | |
833 --mismatch-base-quality-threshold Q Count mismatches toward --read-mismatch-limit if the base | |
834 quality of the mismatch is >= Q. default: 10 | |
835 --read-mismatch-limit N Exclude reads with more than N mismatches where each mismatch | |
836 has base quality >= mismatch-base-quality-threshold. | |
837 default: ~unbounded | |
838 --read-max-mismatch-fraction N Exclude reads with more than N [0,1] fraction of mismatches where | |
839 each mismatch has base quality >= mismatch-base-quality-threshold | |
840 default: 1.0 | |
841 --read-snp-limit N Exclude reads with more than N base mismatches, ignoring gaps | |
842 with quality >= mismatch-base-quality-threshold. | |
843 default: ~unbounded | |
844 --read-indel-limit N Exclude reads with more than N separate gaps. | |
845 default: ~unbounded | |
846 --standard-filters Use stringent input base and mapping quality filters | |
847 Equivalent to -m 30 -q 20 -R 0 -S 0 | |
848 --min-alternate-fraction N Require at least this fraction of observations supporting | |
849 an alternate allele within a single individual in the | |
850 in order to evaluate the position. default: 0.05 | |
851 --min-alternate-count N Require at least this count of observations supporting | |
852 an alternate allele within a single individual in order | |
853 to evaluate the position. default: 2 | |
854 --min-alternate-qsum N Require at least this sum of quality of observations supporting | |
855 an alternate allele within a single individual in order | |
856 to evaluate the position. default: 0 | |
857 --min-alternate-total N Require at least this count of observations supporting | |
858 an alternate allele within the total population in order | |
859 to use the allele in analysis. default: 1 | |
860 --min-coverage N Require at least this coverage to process a site. default: 0 | |
861 --limit-coverage N Downsample per-sample coverage to this level if greater than this coverage. | |
862 default: no limit | |
863 --skip-coverage N Skip processing of alignments overlapping positions with coverage >N. | |
864 This filters sites above this coverage, but will also reduce data nearby. | |
865 default: no limit | |
866 | |
867 **Population priors**:: | |
868 | |
869 --no-population-priors Equivalent to --pooled-discrete --hwe-priors-off and removal of | |
870 Ewens Sampling Formula component of priors. | |
871 | |
872 **Mappability priors**:: | |
873 | |
874 --hwe-priors-off Disable estimation of the probability of the combination | |
875 arising under HWE given the allele frequency as estimated | |
876 by observation frequency. | |
877 --binomial-obs-priors-off Disable incorporation of prior expectations about observations. | |
878 Uses read placement probability, strand balance probability, | |
879 and read position (5'-3') probability. | |
880 --allele-balance-priors-off Disable use of aggregate probability of observation balance between alleles | |
881 as a component of the priors. | |
882 | |
883 **Genotype likelihoods**:: | |
884 | |
885 --observation-bias FILE Read length-dependent allele observation biases from FILE. | |
886 The format is [length] [alignment efficiency relative to reference] | |
887 where the efficiency is 1 if there is no relative observation bias. | |
888 --base-quality-cap Q Limit estimated observation quality by capping base quality at Q. | |
889 --prob-contamination F An estimate of contamination to use for all samples. default: 10e-9 | |
890 --legacy-gls Use legacy (polybayes equivalent) genotype likelihood calculations | |
891 --contamination-estimates FILE A file containing per-sample estimates of contamination, such as | |
892 those generated by VerifyBamID. The format should be: | |
893 sample p(read=R|genotype=AR) p(read=A|genotype=AA) | |
894 Sample '*' can be used to set default contamination estimates. | |
895 | |
896 **Algorithmic features**:: | |
897 | |
898 --report-genotype-likelihood-max Report genotypes using the maximum-likelihood estimate provided | |
899 from genotype likelihoods. | |
900 --genotyping-max-iterations N Iterate no more than N times during genotyping step. default: 1000. | |
901 --genotyping-max-banddepth N Integrate no deeper than the Nth best genotype by likelihood when | |
902 genotyping. default: 6. | |
903 --posterior-integration-limits N,M Integrate all genotype combinations in our posterior space | |
904 which include no more than N samples with their Mth best | |
905 data likelihood. default: 1,3. | |
906 --exclude-unobserved-genotypes Skip sample genotypings for which the sample has no supporting reads. | |
907 --genotype-variant-threshold N Limit posterior integration to samples where the second-best | |
908 genotype likelihood is no more than log(N) from the highest | |
909 genotype likelihood for the sample. default: ~unbounded | |
910 --use-mapping-quality Use mapping quality of alleles when calculating data likelihoods. | |
911 --harmonic-indel-quality Use a weighted sum of base qualities around an indel, scaled by the | |
912 distance from the indel. By default use a minimum BQ in flanking sequence. | |
913 --read-dependence-factor N Incorporate non-independence of reads by scaling successive | |
914 observations by this factor during data likelihood | |
915 calculations. default: 0.9 | |
916 --genotype-qualities Calculate the marginal probability of genotypes and report as GQ in | |
917 each sample field in the VCF output. | |
918 | |
919 ------ | |
920 | |
683 **Acknowledgments** | 921 **Acknowledgments** |
684 | 922 |
685 The initial version of the wrapper was produced by Dan Blankenberg and upgraded by Anton Nekrutenko. | 923 The initial version of the wrapper was produced by Dan Blankenberg and upgraded by Anton Nekrutenko. |
686 TNG was developed by Bjoern Gruening. | 924 TNG was developed by Bjoern Gruening. |
925 ]]> | |
687 </help> | 926 </help> |
688 <expand macro="citations"> | 927 <expand macro="citations"> |
689 <citation type="bibtex"> | 928 <citation type="bibtex"> |
690 @article{Tange2011a, | 929 @article{Tange2011a, |
691 title = {GNU Parallel - The Command-Line Power Tool}, | 930 title = {GNU Parallel - The Command-Line Power Tool}, |