comparison DC_Genotyper.xml @ 0:e8a32d824f39 draft

Uploaded
author geert-vandeweyer
date Thu, 25 Sep 2014 05:24:35 -0400
parents
children fa8566bd4a51
comparison
equal deleted inserted replaced
-1:000000000000 0:e8a32d824f39
1 <tool id="Paired_fastQ_trimmer" name="Paired FastQ QC-Trimmer" >
2 <description></description>
3 <!-- Packages declared as requirements for this tool; each entry names a fixed version except twoBitToFa, which asks for 'latest'. --> <requirements>
4 <requirement type="package" version="3.0.2">R</requirement>
5 <requirement type="package" version="0.1.18">samtools</requirement>
6 <requirement type="package" version="0.2.6">tabix</requirement>
7 <requirement type="package" version="latest">twoBitToFa</requirement>
8 <requirement type="package" version="1.92">perl_module_threads</requirement>
9 <requirement type="package" version="1.46">perl_module_threads_shared</requirement>
10 <requirement type="package" version="3.02">perl_module_Thread_Queue</requirement>
11 <requirement type="package" version="2.3.32">igvtools</requirement>
12 </requirements>
13 <!-- Runs DC_Genotyper.pl through perl. The BED targets go to -t, the BAM file to -b, the path field of the selected reference entry to -R, and GALAXY_SLOTS (falling back to 4 when unset or empty) to -p. -s receives either the history dataset or the path field of the built-in dbSNP entry, depending on dbsnp.source. mincov and ploidy go to -m and -P; output1 and output2 go to -a and -v. --> <command interpreter="perl">DC_Genotyper.pl
14 -t "$targets"
15 -b "$bamfile"
16 -R "${ref.fields.path}"
17 -p "\${GALAXY_SLOTS:-4}"
18 #if $dbsnp.source == "history":
19 -s "${dbsnp.ownFile}"
20 #else
21 -s "${dbsnp.indices.fields.path}"
22 #end if
23 -m $mincov
24 -P $ploidy
25
26 -a $output1
27 -v $output2
28 </command>
29
30 <!-- Tool parameters: the sample BAM, the enrichment BED, a reference genome chosen from the DC_Genotyper_indexes data table, a dbSNP source (a built-in entry from dbsnp_indexes or a VCF/BCF dataset from the history), the minimal coverage depth (default 400) and the expected sample ploidy (default 10). --> <inputs>
31 <param name="bamfile" type="data" format="bam" label="Sample BAM file" />
32 <param name="targets" type="data" format="bed" label="Enrichment BED file" />
33 <param name="ref" type="select" label="Select a reference genome">
34 <options from_data_table="DC_Genotyper_indexes">
35 <filter type="sort_by" column="2" />
36 <validator type="no_options" message="No indexes are available" />
37 </options>
38 </param>
39 <conditional name="dbsnp">
40 <param name="source" type="select" label="Will you select a dbSNP file from your history, or use a built in version (which is faster)">
41 <option value="indexed">Use a built-in version</option>
42 <option value="history">Use one from the history</option>
43 </param>
44 <when value="indexed">
45 <param name="indices" type="select" label="Select a built-in dbSNP file">
46 <options from_data_table="dbsnp_indexes">
47 <filter type="sort_by" column="2" />
48 <validator type="no_options" message="No indexes are available" />
49 </options>
50 </param>
51 </when>
52 <when value="history">
53 <param name="ownFile" type="data" format="vcf,bcf" label="Select a dbSNP file from history"/>
54 </when>
55
56 </conditional>
57 <param name="mincov" value="400" type="integer" label="Minimal Coverage Depth" />
58 <param name="ploidy" type="integer" value="10" label="Expected Sample Ploidy" />
59 </inputs>
60
61 <!-- Two output datasets: output1 (txt, allele fraction distributions) is handed to the script as -a, and output2 (vcf) as -v. --> <outputs>
62 <data format="txt" name="output1" label="${tool.name} on ${on_string}: Allele Fraction Distributions"/>
63 <data format="vcf" name="output2" label="${tool.name} on ${on_string}: VCF file"/>
64 </outputs>
65 <help>
66
67 **What it does**
68
69 1. Get allele counts on all positions in the specified targets (bed) using igvtools. Only SNPs are considered!
70 2. Remove known dbSNP positions (bcf file)
71 3. Get distribution of background noise (pcr/sequencing errors), by modelling allele fractions as normal distributions.
72 4. Based on these distributions, check each position for significant change from the reference allele (based on allele fraction)
73 5. For aberrant positions, check each alternate allele to see if it passes the background signal.
74 6. Generate VCF file.
75
76
77 **Information**
78
79 This tool was created by Geert Vandeweyer. It is a very early version with several limitations. Current limitations are: no support for indels, no plotting of the noise models, and incorrect syntax for multi-allelic sites in the VCF file.
80
81 Any feedback is welcome.
82
83 </help>
84 </tool>