1
|
1 <?xml version="1.0"?>
|
|
2 <tool id="vcf2gff_1" name="Convert vcf to gff">
|
|
3 <description>Convert vcf to gff</description>
|
|
4 <command interpreter="python">vcf_gff.py $inputVcf $outputfile</command>
|
|
5 <inputs>
|
|
6 <param format="vcf" name="inputVcf" type="data" label="vcf file containing SNP data"/>
|
|
7 </inputs>
|
|
8 <outputs>
|
|
9 <data format="gff3" name="outputfile" />
|
|
10 </outputs>
|
5
|
11 <tests>
|
|
12 <test>
|
|
13 <param name="inputVcf" value="mpileup_out.vcf" ftype="vcf"/>
|
|
14 <output name="outputfile" file="mpileup_vcf_to_gff_output.gff"/>
|
|
15 </test>
|
|
16 <test>
|
|
17 <param name="inputVcf" value="freebayes_out.vcf" ftype="vcf"/>
|
|
18 <output name="outputfile" file="freebayes_vcf_to_gff_output.gff"/>
|
|
19 </test>
|
|
20 </tests>
|
1
|
21 <help>
|
|
22
|
|
23 ** Convert vcf to gff3**
|
|
24
|
|
25 This tool takes vcf output from Samtools mpileup and converts to gff3 format.
|
|
26 It converts a single vcf output file containing output from a single bam file or from multiple bam files.
|
|
27 Read counts and GT scores are used as an indicator of whether a mutation is homozygous or heterozygous and outputs in the INFO section.
|
|
28
|
|
29 **TIP**
|
|
30 mpileup **must** be run with Genotype Likelihood Computation selected (-g flag)to generate the GT flag in BCF/VCF output.
|
|
31 This then used to estimate the SNP presence in one or more samples.
|
|
32 More info is available in the manual pages at: http://samtools.sourceforge.net/mpileup.shtml
|
|
33
|
|
34
|
|
35 **Example**
|
|
36
|
|
37 --input vcf
|
|
38
|
|
39 ::
|
|
40
|
|
41 #CHROM POS ID REF ALT QUAL FILTER INFO FORMAT bam
|
|
42 PGSC0003DMB000000001 430 . A T 3.41 . DP=4;AF1=0.9904;CI95=0.125,1;DP4=0,0,2,0;MQ=17 PL:DP:GT:GQ 32,6,0:2:1/1:23
|
|
43 PGSC0003DMB000000001 445 . G T 3.41 . DP=4;AF1=0.9904;CI95=0.125,1;DP4=0,0,2,0;MQ=17 PL:DP:GT:GQ 32,6,0:2:1/1:23
|
|
44 PGSC0003DMB000000001 446 . G A 3.41 . DP=4;AF1=0.9904;CI95=0.125,1;DP4=0,0,2,0;MQ=17 PL:DP:GT:GQ 32,6,0:2:1/1:23
|
|
45 PGSC0003DMB000000001 452 . C T 3.41 . DP=4;AF1=0.9904;CI95=0.125,1;DP4=0,0,2,0;MQ=17 PL:DP:GT:GQ 32,6,0:2:1/1:23
|
|
46
|
|
47 --output gff
|
|
48
|
|
49 ::
|
|
50
|
|
51 #CHROM SOURCE TYPE START STOP QUAL STRAND PHASE INFO
|
|
52 PGSC0003DMB000000001 SAMTOOLS SNP 430 430 3.41 . . ID=PGSC0003DMB000000001:SNP:430;Variant_seq=T;Reference_seq=A;Total_reads=4:Zygosity=2:HOM_mut
|
|
53 PGSC0003DMB000000001 SAMTOOLS SNP 445 445 3.41 . . ID=PGSC0003DMB000000001:SNP:445;Variant_seq=T;Reference_seq=G;Total_reads=4:Zygosity=2:HOM_mut
|
|
54 PGSC0003DMB000000001 SAMTOOLS SNP 446 446 3.41 . . ID=PGSC0003DMB000000001:SNP:446;Variant_seq=A;Reference_seq=G;Total_reads=4:Zygosity=2:HOM_mut
|
|
55 PGSC0003DMB000000001 SAMTOOLS SNP 452 452 3.41 . . ID=PGSC0003DMB000000001:SNP:452;Variant_seq=T;Reference_seq=C;Total_reads=4:Zygosity=2:HOM_mut
|
|
56
|
|
57
|
|
58
|
|
59 -----------------------
|
|
60
|
|
61 *If you use this tool please cite:*
|
|
62
|
|
63 A Toolkit For Bulk PCR-Based Marker Design From Next-Generation Sequence Data:
|
|
64 Application For Development Of A Framework Linkage Map In Bulb Onion (*Allium cepa* L.)
|
|
65 (2012)
|
|
66
|
|
67 Samantha Baldwin, Roopashree Revanna, Susan Thomson, Meeghan Pither-Joyce, Kathryn Wright,
|
|
68 Ross Crowhurst, Mark Fiers, Leshi Chen, Richard MacKnight, John A. McCallum
|
|
69
|
|
70 </help>
|
5
|
71 </tool>
|