# HG changeset patch # User superyuan # Date 1404139794 14400 # Node ID 85bdf226b67b98d73dc65d0b21ddaf9a46f0685d # Parent 9259f293935793a95d990f452603d3a3dc8b7bed add vcf2genotypes and test-data diff -r 9259f2939357 -r 85bdf226b67b test-data/hg19test.fa --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/hg19test.fa Mon Jun 30 10:49:54 2014 -0400 @@ -0,0 +1,12 @@ +>chr1 +NNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNNN +TCAGTGTCCTCCCATGGATGTTAATGTTCTCCATATGATGTCAGTGTCCT +CCATATGATGTCAGTGTCCTCCATATGACATCAATATCCTCCATATGATA +TCAATATCCTCTGTATTGATATTGATATTGATATTTGGAGGATATCAATA +TCCTCCAAATGATGTCAGTGTCCTCCATATGATGTCAATGTCCTCCATAT +GATGTCAATATCCTCCGTATGATGTCAATATCCTCCGTATGATGTCAATA +TCCTCCATATGATGTCAGTGTCCTCTGTATGACATCAATATCCTCCATAC +GATGCCCCTGTCCTTCATATGATGTCAGTGTCCTTTTGTGAGCACCAGTG +TCCTTTGTATGACATCAGTAGTCTCCCATGAATGTCACTGTCTTCCCATA +GATGTCAGTGTCCTCTccaaaagacaagcagaagctgttcatggaatgat +gtgggggaaccttccagaaagaggcaacatcatgtgctaaggtcccaggt diff -r 9259f2939357 -r 85bdf226b67b test-data/test.fastq --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/test.fastq Mon Jun 30 10:49:54 2014 -0400 @@ -0,0 +1,4 @@ +@ERR000038.1 BGI-FC302WFAAXX_5_1_1204:1431 +CCTTCATATGATGTCAGAGTCCTCTGTATGACCTCA ++ +IIIIII$IIII(IIIIIIIIIIIII2@IIIII:I>& diff -r 9259f2939357 -r 85bdf226b67b test-data/test.vcf --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/test.vcf Mon Jun 30 10:49:54 2014 -0400 @@ -0,0 +1,8 @@ +##fileformat=VCFv4.0 +##fileDate=20110201 +##reference=NCBI37 +##source=Affymetrix_Axiom_DB +##FORMAT= +#CHROM POS ID REF ALT QUAL FILTER INFO FORMAT NA18501 NA18502 NA18504 NA18505 NA18507 NA18508 NA18516 NA18517 NA18522 NA18523 NA18852 NA18853 NA18855 NA18856 NA18858 NA18859 NA18861 NA18862 NA18870 NA18871 NA18912 NA18913 NA19092 NA19093 NA19098 NA19099 NA19101 NA19102 NA19116 NA19119 NA19127 NA19128 NA19130 NA19131 NA19137 NA19138 NA19140 NA19141 NA19143 NA19144 NA19152 NA19153 NA19159 NA19160 NA19171 NA19172 NA19192 NA19193 NA19200 NA19201 NA19203 NA19204 
NA19206 NA19207 NA19209 NA19210 NA19222 NA19223 NA19238 NA19239 +1 305 rs5 C T . PASS . GT 0/0 0/0 0/0 0/0 0/0 0/0 0/0 0/0 0/0 0/0 0/0 0/0 0/0 0/0 0/0 0/0 0/0 0/0 0/0 0/0 0/0 0/0 0/0 0/0 0/0 0/0 0/0 0/0 0/0 0/0 0/0 0/0 0/0 0/0 0/0 0/0 0/0 0/0 0/0 0/0 0/0 0/0 0/0 0/0 0/0 0/0 0/0 0/0 0/0 0/0 0/0 0/0 0/0 0/0 0/0 0/0 0/0 0/1 0/1 0/0 +1 334 . A C . PASS . GT 0/0 0/0 ./. 0/0 ./. 0/0 ./. ./. 0/0 ./. 0/0 0/0 ./. 0/0 ./. 0/0 0/0 0/0 ./. ./. 0/0 ./. 0/0 0/0 ./. 0/0 ./. ./. ./. 0/0 0/0 ./. 0/0 0/0 0/0 ./. 0/0 0/0 0/0 ./. 0/0 ./. ./. 0/0 ./. 0/0 ./. 0/0 0/0 0/0 ./. ./. 0/0 0/0 0/0 ./. 0/0 0/0 0/1 0/0 diff -r 9259f2939357 -r 85bdf226b67b tool_conf.xml --- a/tool_conf.xml Thu Jun 12 04:56:10 2014 -0400 +++ b/tool_conf.xml Mon Jun 30 10:49:54 2014 -0400 @@ -1,6 +1,7 @@
+
diff -r 9259f2939357 -r 85bdf226b67b tools/refeditor/vcf2genotypes.py
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/tools/refeditor/vcf2genotypes.py Mon Jun 30 10:49:54 2014 -0400
@@ -0,0 +1,90 @@
+# Filename: vcf2genotypes.py
+# Author: Shuai Yuan
+# Version: 06/29/2012
+#
+# This script is a wrapper for vcf2genotypes
+#
+# vcf2genotypes is launched based on these inputs:
+# -i input VCF file
+# -p target individual
+# -o output genotypes file
+
+import sys
+import os
+import re
+import string
+import commands
+import subprocess
+from tempfile import NamedTemporaryFile
+
+USAGE = "Usage: vcf2genotypes.py -i <input.vcf> -p <individual> -o <output>"
+
+
+def getopts(argv):
+    """Collect '-flag value' pairs from argv into a dict.
+
+    Tokens that do not start with '-' are skipped. Raises IndexError
+    when a flag is the last token and therefore has no value.
+    """
+    opts = {}
+    while argv:
+        if argv[0].startswith('-'):
+            if len(argv) < 2:
+                raise IndexError("option %s requires a value" % argv[0])
+            opts[argv[0]] = argv[1]
+            argv = argv[2:]
+        else:
+            argv = argv[1:]
+    return opts
+
+
+def main():
+    """Run vcf2genotypes for one individual and return its exit code.
+
+    Returns 2 for a malformed command line, -1/-2/-6 when -i/-p/-o is
+    missing, 127 when the vcf2genotypes executable cannot be started,
+    and otherwise the exit code of vcf2genotypes itself.
+    """
+    try:
+        opts = getopts(sys.argv[1:])
+    except IndexError:
+        print(USAGE)
+        return 2
+
+    vcf = opts.get("-i")
+    if vcf is None:
+        print("No input VCF file specified.")
+        return -1
+
+    individual = opts.get("-p")
+    if individual is None:
+        print("No valid individual specified.")
+        return -2
+
+    outputfile = opts.get("-o")
+    if outputfile is None:
+        print("No output file specified.")
+        return -6
+
+    # All inputs have been specified at this point.
+    # Pass an argument list (no shell) so that paths or sample names
+    # containing spaces or shell metacharacters cannot alter the command.
+    command = ["vcf2genotypes", vcf, individual]
+    with open(outputfile, "wb") as out_handle:
+        try:
+            proc = subprocess.Popen(command, stdout=out_handle,
+                                    stderr=subprocess.PIPE,
+                                    universal_newlines=True)
+        except OSError as exc:
+            sys.stderr.write("Could not run vcf2genotypes: %s\n" % exc)
+            return 127
+        errors = proc.communicate()[1]
+
+    # Stay quiet on success; surface the tool's diagnostics on failure.
+    if proc.returncode != 0 and errors:
+        sys.stderr.write(errors)
+    return proc.returncode
+
+
+if __name__ == "__main__":
+    sys.exit(main())
diff -r 9259f2939357 -r 85bdf226b67b tools/refeditor/vcf2genotypes.xml
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/tools/refeditor/vcf2genotypes.xml Mon Jun 30 10:49:54 2014 -0400
@@ -0,0 +1,18 @@
+
+ Extracts genotypes for a particular individual from VCF File
+ vcf2genotypes.py
+ -i '$input'
+ -p '$person'
+ -o $out_file1
+
+
+
+
+
+
+
+
+
+
+
+