Mercurial > repos > bgruening > minced
diff reformat.py @ 0:20f12e7c279b draft
Imported from capsule None
author | bgruening |
---|---|
date | Mon, 05 May 2014 04:23:26 -0400 |
parents | |
children |
line wrap: on
line diff
--- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/reformat.py Mon May 05 04:23:26 2014 -0400 @@ -0,0 +1,24 @@ +#!/usr/bin/env python + +""" + Extract importent information from the standard output file and put it in some standard format, like BED and tabular. +""" + +import sys + +bed = open(sys.argv[2], 'w+') +tabular = open(sys.argv[3], 'w+') + +for line in open(sys.argv[1]): + # Sequence 'CRISPRs' (10798 bp) + if line.startswith('Sequence '): + organism = line.split("'")[1] + # CRISPR 1 Range: 679197 - 682529 + if line.startswith('CRISPR '): + start,end = line.split('Range:')[1].strip().split('-') + start = start.strip() + end = end.strip() + bed.write('%s\t%s\t%s\n' % (organism, start, end)) + if line.rstrip().endswith(']'): + cols = line.split() + tabular.write("%s\t%s\t%s\t%s\t%s\t%s\n" % (organism, cols[0], cols[1], cols[2], cols[4].rstrip(','), cols[5]))