0
|
1 # ----------------------------------------------------------------------#
|
|
2 # Copyright (c) 2011, Richard Lupat & Jason Li.
|
|
3 #
|
|
4 # > Source License <
|
|
5 # This file is part of CONTRA.
|
|
6 #
|
|
7 # CONTRA is free software: you can redistribute it and/or modify
|
|
8 # it under the terms of the GNU General Public License as published by
|
|
9 # the Free Software Foundation, either version 3 of the License, or
|
|
10 # (at your option) any later version.
|
|
11 #
|
|
12 # CONTRA is distributed in the hope that it will be useful,
|
|
13 # but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
14 # MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
|
15 # GNU General Public License for more details.
|
|
16 #
|
|
17 # You should have received a copy of the GNU General Public License
|
|
18 # along with CONTRA. If not, see <http://www.gnu.org/licenses/>.
|
|
19 #
|
|
20 #
|
|
21 #-----------------------------------------------------------------------#
|
|
22 # Last Updated : 05 October 2011 16:43PM
|
|
23
|
|
24
|
|
25 import subprocess, shlex
|
|
26
|
|
def get_genome(srcFile, genomeOut):
    """Write a genome file (sequence name and length) from an alignment header.

    Runs ``samtools view -H`` on ``srcFile`` and, for every ``@SQ`` header
    record, writes one tab-separated line ``<SN value> <LN value>`` to
    ``genomeOut``. Records are written in the order samtools prints them.

    Parameters:
        srcFile   -- path of the alignment file handed to ``samtools view -H``.
        genomeOut -- path of the text file to create (overwritten if present).

    Raises:
        OSError -- if the ``samtools`` executable cannot be started, or if
                   ``genomeOut`` cannot be opened for writing.

    ``@SQ`` records that lack either an ``SN`` or an ``LN`` tag are skipped.
    """
    # Pass the arguments as a list so that a path containing spaces or quotes
    # reaches samtools as a single argument.
    args = ["samtools", "view", "-H", srcFile]

    # universal_newlines=True makes communicate() return text rather than
    # bytes on Python 3, while remaining valid on Python 2.
    raw_header = subprocess.Popen(
        args, stdout=subprocess.PIPE, universal_newlines=True
    ).communicate()[0]

    # The context manager guarantees the output file is closed even if a
    # write fails part-way through.
    with open(genomeOut, "w") as genome:
        for line in raw_header.splitlines():
            fields = line.split("\t")
            if fields[0] != "@SQ":
                continue

            # Look the tags up by name instead of by position, and split on
            # the first ':' only. str.strip("SN:") would remove any leading or
            # trailing 'S', 'N' or ':' characters and corrupt names such as
            # "NC_000001" or "chrS".
            tags = dict(
                field.split(":", 1) for field in fields[1:] if ":" in field
            )
            if "SN" not in tags or "LN" not in tags:
                continue

            genome.write(tags["SN"] + "\t" + tags["LN"] + "\n")
|
|
42
|
|
43
|