Mercurial > repos > xuebing > sharplabtool
view tools/human_genome_variation/freebayes.xml @ 1:cdcb0ce84a1b
Uploaded
author | xuebing |
---|---|
date | Fri, 09 Mar 2012 19:45:15 -0500 |
parents | 9071e359b9a3 |
children |
line wrap: on
line source
<?xml version="1.0"?> <tool id="freebayes_wrapper" name="Call SNPS with Freebayes" version="0.5.0"> <requirements> <requirement type="package">freebayes</requirement> </requirements> <description>Bayesian genetic variant detector</description> <command> ln -s $reference localref.fa; ln -s $bamfile localbam.bam; samtools faidx localref.fa; samtools sort localbam.bam localbam.bam; samtools index localbam.bam; freebayes --fasta-reference localref.fa localbam.bam --vcf $output #if $params.source_select == "full": $params.showRefRepeats -T $params.theta -p $params.ploidy $params.pooled $params.mnps $params.nosnps -n $params.bestAlleles $params.allAlleles $params.duplicateReads -M $params.refMapQuality $params.ignoreRefAllele $params.haploidReference -m $params.minMapQuality -q $params.minBaseQuality $params.noFilters -x $params.indelExclusionWindow <!-- -D $readDependenceFactor --> -V $params.diffusionPriorScalar -W $params.postIntegBandwidth -Y $params.postIntegBanddepth -F $params.minAltFraction -C $params.minAltCount -G $params.minAltTotal --min-coverage $params.minCoverage #end if </command> <inputs> <param format="fasta" name="reference" type="data" metadata_name="dbkey" label="Reference File"/> <param format="bam" name="bamfile" type="data" label="Bam Alignment File"/> <conditional name="params"> <param name="source_select" type="select" label="Freebayes Settings to Use" help="For straight forward mapping needs use Commonly Used settings. If you want full control use Full Parameter List"> <option value="pre_set">Commonly Used</option> <option value="full">Full Parameter List</option> </param> <when value="pre_set"/> <when value="full"> <param name="indels" type="select" label="Include insertion and deletion alleles in the analysis"> <option value="">No</option> <option value="-i -N --report-all-alternates --left-align-indels">Yes</option> </param> <param name="theta" size="5" type="float" value="0.001" label="Theta" help="The expected mutation rate or pairwise nucleotide diversity among the population under analysis. This serves as the single parameter to the Ewens Sampling Formula prior model"/> <param name="showRefRepeats" type="select" label="Show Reference Repeats" help="Calculate and show information about reference repeats in the VCF output"> <option value="">No</option> <option value="-_">Yes</option> </param> <param name="ploidy" size="5" type="integer" value="2" label="Ploidy" help="Sets the default ploidy for the analysis"/> <param name="pooled" type="select" label="Pooled" help="Assume that samples result from pooled sequencing. When using this flag, set --ploidy to the number of alleles in each sample"> <option value="">No</option> <option value="-J">Yes</option> </param> <param name="mnps" type="select" label="Include multi-nuceotide polymorphisms in the analysis"> <option value="">No</option> <option value="--mnps">Yes</option> </param> <param name="nosnps" type="select" label="Ignore SNP alleles"> <option value="">No</option> <option value="--no-snps">Yes</option> </param> <param name="duplicateReads" type="select" label="Include duplicate-marked alignments in the analysis"> <option value="">No</option> <option value="--use-duplicate-reads">Yes</option> </param> <param name="bestAlleles" size="5" type="integer" value="2" label="Use Best N Alleles" help="Evaluate only the best N alleles, ranked by sum of supporting quality scores"/> <param name="allAlleles" type="select" label="Evaluate all possible alleles"> <option value="">No</option> <option value="--use-all-alleles">Yes</option> </param> <param name="refMapQuality" size="5" type="integer" value="100" label="Assign mapping quality of Q to the reference allele at each site"/> <param name="refBaseQuality" size="5" type="integer" value="60" label="Reference Base Quality" help="Assign a base quality of Q to the reference allele at each site"/> <param name="minMapQuality" size="5" type="integer" value="10" label="Minimum Mapping Quality" help="Exclude alignments from analysis if they have a mapping quality less than Q"/> <param name="minBaseQuality" size="5" type="integer" value="5" label="Minimum Base Quality" help="Exclude alleles from analysis if their supporting base quality is less than Q"/> <param name="indelExclusionWindow" size="5" type="integer" value="0" label="Indel Exclusion Window" help="Ignore portions of alignments N bases from a putative insertion or deletion allele"/> <param name="ignoreRefAllele" type="select" label="Ignore Reference Allele" help="By default, the reference allele is considered as another sample. This flag excludes it from the analysis"> <option value="">No</option> <option value="--ignore-reference-allele">Yes</option> </param> <param name="haploidReference" type="select" label="Haploid Reference" help="If using the reference sequence as a sample, consider it to be haploid"> <option value="">No</option> <option value="--haploid-reference">Yes</option> </param> <param name="noFilters" type="select" label="No Filters" help="Do not use any input base and mapping quality filters. Equivalent to -m 0 -q 0 -R 0 -S 0"> <option value="">No</option> <option value="--no-filters">Yes</option> </param> <!-- <param name="readDependenceFactor" size="5" type="float" value="0.9" label="Read Dependence Factor" help="Incorporate non-independence of reads by scaling successive observations by this factor during data likelihood calculations"/> --> <param name="diffusionPriorScalar" size="5" type="float" value="1" label="Diffusion Prior Scalar" help="Downgrade the significance of P(genotype combo | allele frequency) by taking the Nth root of this component of the prior"/> <param name="postIntegBandwidth" size="5" type="integer" value="2" label="Posterior Integratoin Bandwidth" help="Integrate all genotype combinations in our posterior space which lie no more than N steps from the most likely combination in terms of data likelihoods, taking the N steps from the most to least likely genotype for each individual"/> <param name="postIntegBanddepth" size="5" type="integer" value="2" label="Posterior Integratoin Banddepth" help="Generate all genotype combinations for which up to this number of samples have up to their -W'th worst genotype according to data likelihood"/> <param name="minAltFraction" size="5" type="integer" value="0" label="Minimum Alternative Fraction" help="Require at least this fraction of observations supporting an alternate allele within a single individual in the in order to evaluate the position"/> <param name="minAltCount" size="5" type="integer" value="1" label="Minimum Alternative Count" help="Require at least this count of observations supporting an alternate allele within a single individual in order to evaluate the position"/> <param name="minAltTotal" size="5" type="integer" value="1" label="Minimum Alternative Total" help="Require at least this count of observations supporting an alternate allele within the total population in order to use the allele in analysis"/> <param name="minCoverage" size="5" type="integer" value="0" label="Minimum Coverage" help="Require at least this coverage to process a site"/> </when> </conditional> </inputs> <outputs> <data format="vcf" name="output" metadata_source="reference" /> </outputs> <tests> <test> <param name="reference" ftype="fasta" value="mosaik_test_ref.fasta"/> <param name="bamfile" ftype="bam" value="freebayes_in.bam"/> <param name="source_select" value="pre_set"/> <output name="output" file="freebayes_out.vcf" lines_diff="4"/> </test> </tests> <help> This tool uses Freebayes to call SNPS given a reference sequence and a BAM alignment file. </help> </tool>