diff gatk4_Mutect2.xml @ 6:fb0bb7174530 draft default tip

planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/gatk4 commit 301f94b20e29da22d5f4502c44344f4a0115930d
author iuc
date Wed, 24 Aug 2022 17:59:05 +0000
parents 53ce8be43212
children
line wrap: on
line diff
--- a/gatk4_Mutect2.xml	Wed Oct 06 12:05:42 2021 +0000
+++ b/gatk4_Mutect2.xml	Wed Aug 24 17:59:05 2022 +0000
@@ -1,4 +1,4 @@
-<tool id="gatk4_mutect2" name="GATK4 Mutect2" version="@WRAPPER_VERSION@" profile="18.05">
+<tool id="gatk4_mutect2" name="GATK4 Mutect2" version="@WRAPPER_VERSION@+galaxy1" profile="18.05">
     <description>- Call somatic SNVs and indels via local assembly of haplotypes</description>
     <macros>
         <import>macros.xml</import>
@@ -248,6 +248,7 @@
             --minimum-allele-fraction="$advanced.minimum_allele_fraction"
             --num-pruning-samples="$advanced.num_pruning_samples"
             --pair-hmm-gap-continuation-penalty="$advanced.pair_hmm_gap_continuation_penalty"
+            --callable-depth="$advanced.callable_depth"
             --pair-hmm-implementation="$advanced.pair_hmm_implementation"
             --pcr-indel-model="$advanced.pcr_indel_model"
             --phred-scaled-global-read-mismapping-rate="$advanced.phred_scaled_global_read_mismapping_rate"
@@ -411,7 +412,6 @@
                 <param name="pedigree" argument="--pedigree" type="data" optional="true" format="vcf,vcf_bgzip" label="Pedigree" help="Pedigree file for determining the population &quot;founders&quot;. If a file is provided here, a pedigree-based annotation must be added above."/>
                 <param name="base_quality_score_threshold" argument="--base-quality-score-threshold" type="integer" optional="true" value="18" label="Base Quality Score Threshold" help="Base qualities below this threshold will be reduced to the minimum (6)"/>
                 <param name="callable_depth" argument="--callable-depth" type="integer" optional="true" value="10" label="Minimum depth to be considered callable" help="Does not affect genotyping"/>
-                <param name="contamination_fraction_to_filter" argument="--contamination-fraction-to-filter" type="float" optional="true" value="0.0" label="Contamination Fraction To Filter" help="Fraction of contamination in sequencing data (for all samples) to aggressively remove"/>
                 <param name="disable_bam_index_caching" argument="--disable-bam-index-caching" type="boolean" truevalue="--disable-bam-index-caching" falsevalue="" optional="true" checked="false" label="Disable Bam Index Caching" help="If true, don&amp;apos;t cache bam indexes, this will reduce memory requirements but may harm performance if many intervals are specified.  Caching is automatically disabled if there are no intervals specified."/>
                 <param name="disable_read_filter" argument="--disable-read-filter" type="select" multiple="true" value="" label="Disable Read Filter" help="Read filters to be disabled before analysis">
                     <option value="GoodCigarReadFilter">Good cigar string</option>
@@ -472,10 +472,7 @@
                 <param name="genotype_pon_sites" argument="--genotype-pon-sites" type="boolean" truevalue="--genotype-pon-sites" falsevalue="" optional="true" checked="false" label="Genotype PoN Sites" help="Call sites in the PoN even though they will ultimately be filtered."/>
                 <param name="alleles" argument="--alleles" type="data" optional="true" format="vcf" label="Alleles" help="The set of alleles at which to genotype"/>
                 <param name="germline_resource" argument="--germline-resource" type="data" optional="true" format="vcf,vcf_bgzip" label="Germline Resource" help="Population vcf of germline sequencing containing allele fractions."/>
-                <param name="heterozygosity" argument="--heterozygosity" type="float" optional="true" value="0.001" label="Heterozygosity" help="The expected heterozygosity value used to compute prior probability that a locus is non-reference. The default priors are for provided for humans: het = 1e-3 which means that the probability of N samples being hom-ref at a site is: 1 - sum_i_2N (het / i) Note that heterozygosity as used here is the population genetics concept: http://en.wikipedia.org/wiki/Zygosity#Heterozygosity_in_population_genetics That is, a hets value of 0.01 implies that two randomly chosen chromosomes from the population of organisms would differ from each other (one being A and the other B) at a rate of 1 in 100 bp. Note that this quantity has nothing to do with the likelihood of any given sample having a heterozygous genotype, which in the GATK is purely determined by the probability of the observed data P(D | AB) under the model that there may be a AB het genotype. The posterior probability of this AB genotype would use the het prior, but the GATK only uses this posterior probability in determining the prob. that a site is polymorphic. So changing the het parameters only increases the chance that a site will be called non-reference across all samples, but doesn't actually change the output genotype likelihoods at all, as these aren't posterior probabilities at all. The quantity that changes whether the GATK considers the possibility of a het genotype at all is the ploidy, which determines how many chromosomes each individual in the species carries."/>
-                <param name="heterozygosity_stdev" argument="--heterozygosity-stdev" type="float" optional="true" value="0.01" label="Heterozygosity Stdev" help="Standard deviation of heterozygosity for SNP and indel calling."/>
                 <param name="ignore_itr_artifacts" argument="--ignore-itr-artifacts" type="boolean" truevalue="--ignore-itr-artifacts" falsevalue="" optional="true" checked="false" label="Turn off read transformer that clips artifacts associated with end repair insertions near inverted tandem repeats" />
-                <param name="indel_heterozygosity" argument="--indel-heterozygosity" type="float" optional="true" value="0.000125" label="Indel Heterozygosity" help="Heterozygosity for indel calling.  See the GATKDocs for heterozygosity for full details on the meaning of this population genetics concept"/>
                 <param name="initial_tumor_lod" argument="--initial-tumor-lod" type="float" optional="true" value="2.0" label="Initial Tumor Lod" help="LOD threshold to consider pileup active."/>
                 <param name="interval_exclusion_padding" argument="--interval-exclusion-padding" type="integer" value="0" label="Interval exclusion padding" help="Amount of padding (in bp) to add to each interval you are excluding" />
                 <param name="interval_padding" argument="--interval-padding" type="integer" value="0" label="Interval padding" help="Amount of padding (in bp) to add to each interval you are including" />
@@ -585,7 +582,6 @@
                 <option value="yes">Generate debugging information</option>
             </param>
             <when value="yes">
-                <param name="debug_activity" argument="--activity-profile-out" type="boolean" checked="false" truevalue="yes" falsevalue="" label="Activity Profile Out" help="Output the raw activity profile results in IGV format"/>
                 <param name="debug_assembly" argument="--assembly-region-out" type="boolean" checked="false" truevalue="yes" falsevalue="" label="Assembly Region Out" help="Output the assembly region to this IGV formatted file"/>
                 <param name="debug_bam" argument="--bam-output" type="boolean" checked="false" truevalue="yes" falsevalue="" label="Bam Output" help="The assembled haplotypes and locally realigned reads will be written as BAM to this file if requested. This is intended to be used only for troubleshooting purposes, in specific areas where you want to better understand why the caller is making specific calls"/>
             </when>