Mercurial > repos > aaronpetkau > flash
comparison assembly_stats_txt.py @ 0:44c401ebc424 draft
Uploaded
author | aaronpetkau |
---|---|
date | Sat, 04 Jul 2015 08:57:35 -0400 |
parents | |
children |
comparison
equal
deleted
inserted
replaced
-1:000000000000 | 0:44c401ebc424 |
---|---|
1 #!/usr/bin/env python | |
2 #Version 1.01 - bugs kindly corrected by Jan van Haarst | |
3 import pkg_resources | |
4 import logging, os, string, sys, tempfile, glob, shutil, types, urllib | |
5 import shlex, subprocess | |
6 from optparse import OptionParser, OptionGroup | |
7 from stat import * | |
8 | |
9 | |
# Module-level logger, named after this module.
log = logging.getLogger(__name__)

# Refuse to load on interpreters older than Python 2.4.
assert (2, 4) <= sys.version_info[:2]
13 | |
def stop_err(msg):
    """Write *msg* followed by a newline to stderr and terminate the process.

    The process exits with status 1 so that callers inspecting the exit code
    (and not only stderr) see the failure.

    Args:
        msg: The message to report; it is formatted with ``%s``.

    Raises:
        SystemExit: always, with exit code 1.
    """
    # Wrap in a 1-tuple so a tuple-valued msg is printed, not unpacked.
    sys.stderr.write("%s\n" % (msg,))
    sys.exit(1)
17 | |
def __main__():
    """Run fasta_summary.pl on an input file and copy its reports to the outputs.

    Positional command-line arguments (``sys.argv[1:]``):
        1   html_file         accepted but unused (see note at end of function)
        2   working_dir       passed to fasta_summary.pl as ``-o``; created if missing
        3   type              passed to fasta_summary.pl as ``-t``
        4   bucket            extra option text placed between the ``-t`` value and ``-o``
        5   input             passed to fasta_summary.pl as ``-i``
        6   stats             destination for ``stats.txt``
        7   sortedcontigs     destination for ``sorted_contigs.fa``
        8   histogrampng      destination for ``histogram_bins.dat.png``
        9   summedcontigspng  destination for ``summed_contig_lengths.dat.png``
        10  histogramdata     destination for ``histogram_bins.dat``
        11  summedcontigdata  destination for ``summed_contig_lengths.dat``

    The six report files are read from ``working_dir`` after fasta_summary.pl
    has finished. fasta_summary.pl is looked up next to this script.

    A wrong argument count, a failure to create ``working_dir``, or a failing
    fasta_summary.pl run is reported through ``stop_err``. Errors while copying
    the report files propagate as ordinary exceptions.
    """
    if len(sys.argv) < 12:
        stop_err('Error running assembly_stats_txt.py: expected 11 arguments, got %d'
                 % (len(sys.argv) - 1))

    # sys.argv[1] (html_file) is accepted for interface compatibility only.
    working_dir, seq_type, bucket, fasta_path = sys.argv[2:6]
    destinations = sys.argv[6:12]

    # An already existing working directory is fine; only create it if missing.
    if not os.path.isdir(working_dir):
        try:
            os.makedirs(working_dir)
        except OSError as e:
            stop_err('Error running assembly_stats_txt.py ' + str(e))

    # Resolve the helper relative to this script's absolute location so that
    # an invocation without a directory component does not yield
    # "/fasta_summary.pl".
    script_dir = os.path.dirname(os.path.abspath(sys.argv[0]))
    summary_script = os.path.join(script_dir, 'fasta_summary.pl')

    try:
        # Pass an argument list (no shell) so paths with spaces or shell
        # metacharacters are handed over verbatim. `bucket` is free-form option
        # text that may hold zero or more words, so it is split shell-style.
        args = ([summary_script, '-i', fasta_path, '-t', seq_type]
                + shlex.split(bucket)
                + ['-o', working_dir])
        with open(os.devnull, 'w') as devnull:
            proc = subprocess.Popen(args, stdout=devnull, stderr=subprocess.PIPE)
            # communicate() drains stderr while waiting; calling wait() first
            # can deadlock once the child fills the pipe buffer.
            stderr = proc.communicate()[1]
        if not isinstance(stderr, str):
            # Python 3 returns bytes; decode leniently for the error message.
            stderr = stderr.decode('utf-8', 'replace')
        if proc.returncode != 0:
            raise Exception(stderr)
    except Exception as e:
        stop_err('Error running assembly_stats_txt.py ' + str(e))

    # Report file names expected in working_dir, in the same order as the
    # destination arguments (sys.argv[6:12]).
    report_names = (
        'stats.txt',
        'sorted_contigs.fa',
        'histogram_bins.dat.png',
        'summed_contig_lengths.dat.png',
        'histogram_bins.dat',
        'summed_contig_lengths.dat',
    )
    for report_name, destination in zip(report_names, destinations):
        # Byte-for-byte copy: two of the reports are PNG images, which must not
        # pass through text-mode line iteration.
        shutil.copyfile(os.path.join(working_dir, report_name), destination)

    # NOTE: generation of an HTML index listing the six reports (which would
    # have been written to html_file) is currently disabled.
121 | |
# Run the tool only when this file is executed as a script, not on import.
if __name__ == "__main__":
    __main__()