Mercurial > repos > dannon > metaphlan
comparison metaphlan2krona.py @ 6:e951f9d38339 default tip
Added metaphlan2krona
| author | Dannon Baker <dannonbaker@me.com> | 
|---|---|
| date | Tue, 08 Apr 2014 14:16:46 -0400 | 
| parents | |
| children | 
   comparison
  equal
  deleted
  inserted
  replaced
| 5:73f082e9fa2d | 6:e951f9d38339 | 
|---|---|
| 1 #!/usr/bin/env python | |
| 2 | |
| 3 # ============================================================================== | |
| 4 # Conversion script: from MetaPhlAn output to Krona text input file | |
| 5 # Author: Daniel Brami (daniel.brami@gmail.com) | |
| 6 # ============================================================================== | |
| 7 | |
| 8 import sys | |
| 9 import optparse | |
| 10 import re | |
| 11 | |
| 12 def main(): | |
| 13 #Parse Command Line | |
| 14 parser = optparse.OptionParser() | |
| 15 parser.add_option( '-p', '--profile', dest='profile', default='', action='store', help='The input file is the MetaPhlAn standard result file' ) | |
| 16 parser.add_option( '-k', '--krona', dest='krona', default='krona.out', action='store', help='the Krona output file name' ) | |
| 17 ( options, spillover ) = parser.parse_args() | |
| 18 | |
| 19 if not options.profile or not options.krona: | |
| 20 parser.print_help() | |
| 21 sys.exit() | |
| 22 | |
| 23 re_candidates = re.compile(r"s__|unclassified\t") | |
| 24 re_replace = re.compile(r"\w__") | |
| 25 re_bar = re.compile(r"\|") | |
| 26 | |
| 27 metaPhLan = list() | |
| 28 with open(options.profile,'r') as f: | |
| 29 metaPhLan = f.readlines() | |
| 30 f.close() | |
| 31 | |
| 32 krona_tmp = options.krona | |
| 33 metaPhLan_FH = open(krona_tmp, 'w') | |
| 34 | |
| 35 for aline in (metaPhLan): | |
| 36 if(re.search(re_candidates, aline)): | |
| 37 x=re.sub(re_replace, '\t', aline) | |
| 38 x=re.sub(re_bar, '', x) | |
| 39 | |
| 40 x_cells = x.split('\t') | |
| 41 lineage = '\t'.join(x_cells[0:(len(x_cells) -1)]) | |
| 42 abundance = float(x_cells[-1].rstrip('\n')) | |
| 43 | |
| 44 metaPhLan_FH.write('%s\n'%(str(abundance) + '\t' + lineage)) | |
| 45 | |
| 46 metaPhLan_FH.close() | |
| 47 | |
| 48 if __name__ == '__main__': | |
| 49 main() | 
