annotate rnafold_SHAPE.py @ 2:f3384a8b45a2 draft

planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/rna_tools/vienna_rna commit b'bd13ffd1c3e126a6dc59dd3c478347ec1b5824a3\n'
author rnateam
date Tue, 16 May 2017 16:29:38 -0400
parents
children
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
2
f3384a8b45a2 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/rna_tools/vienna_rna commit b'bd13ffd1c3e126a6dc59dd3c478347ec1b5824a3\n'
rnateam
parents:
diff changeset
1 ### overcoming the problem of SHAPE data working with a single line.
f3384a8b45a2 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/rna_tools/vienna_rna commit b'bd13ffd1c3e126a6dc59dd3c478347ec1b5824a3\n'
rnateam
parents:
diff changeset
2 ### creating multiple files, each containing SHAPE data for a single sequence, and running RNAfold for every
f3384a8b45a2 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/rna_tools/vienna_rna commit b'bd13ffd1c3e126a6dc59dd3c478347ec1b5824a3\n'
rnateam
parents:
diff changeset
3 ### single sequence.
f3384a8b45a2 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/rna_tools/vienna_rna commit b'bd13ffd1c3e126a6dc59dd3c478347ec1b5824a3\n'
rnateam
parents:
diff changeset
4
f3384a8b45a2 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/rna_tools/vienna_rna commit b'bd13ffd1c3e126a6dc59dd3c478347ec1b5824a3\n'
rnateam
parents:
diff changeset
5 import os
f3384a8b45a2 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/rna_tools/vienna_rna commit b'bd13ffd1c3e126a6dc59dd3c478347ec1b5824a3\n'
rnateam
parents:
diff changeset
6 import sys
f3384a8b45a2 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/rna_tools/vienna_rna commit b'bd13ffd1c3e126a6dc59dd3c478347ec1b5824a3\n'
rnateam
parents:
diff changeset
7 from os import system
f3384a8b45a2 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/rna_tools/vienna_rna commit b'bd13ffd1c3e126a6dc59dd3c478347ec1b5824a3\n'
rnateam
parents:
diff changeset
8 from Bio import SeqIO
f3384a8b45a2 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/rna_tools/vienna_rna commit b'bd13ffd1c3e126a6dc59dd3c478347ec1b5824a3\n'
rnateam
parents:
diff changeset
9 import re
f3384a8b45a2 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/rna_tools/vienna_rna commit b'bd13ffd1c3e126a6dc59dd3c478347ec1b5824a3\n'
rnateam
parents:
diff changeset
10 from subprocess import Popen, PIPE
f3384a8b45a2 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/rna_tools/vienna_rna commit b'bd13ffd1c3e126a6dc59dd3c478347ec1b5824a3\n'
rnateam
parents:
diff changeset
11
f3384a8b45a2 planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/rna_tools/vienna_rna commit b'bd13ffd1c3e126a6dc59dd3c478347ec1b5824a3\n'
rnateam
parents:
diff changeset
def split_params(params_list):
    """Separate the ``--shape=`` option from the remaining RNAfold options.

    Args:
        params_list: Command-line arguments (without the program name).

    Returns:
        A ``(shape_file, other_params)`` tuple: the path given to
        ``--shape=`` and the list of all other arguments in original order.

    Raises:
        ValueError: If not exactly one argument contains ``--shape=``.
    """
    shape_args = [s for s in params_list if "--shape=" in s]
    other_params = [s for s in params_list if "--shape=" not in s]
    # Explicit check instead of ``assert`` so it still runs under ``python -O``.
    if len(shape_args) != 1:
        raise ValueError(
            "expected exactly one --shape=<file> argument, got {}".format(
                len(shape_args)))
    return shape_args[0].replace('--shape=', ''), other_params


def write_shape_files(shape_file, out_dir=os.curdir):
    """Split a multi-record SHAPE file into one ``<id>.tmp`` file per record.

    A line starting with ``>`` opens a new record; its id is the first
    whitespace-delimited token without the leading ``>``. Following lines are
    that record's data. Records that share an id are concatenated.

    Args:
        shape_file: Path of the combined SHAPE file.
        out_dir: Directory in which the ``<id>.tmp`` files are created.

    Returns:
        A dict mapping each record id to the path of the file written for it.
    """
    records = {}
    current_id = None
    with open(shape_file, 'r') as handle:
        for raw_line in handle:
            line = raw_line.rstrip("\n")
            if line.startswith(">"):
                current_id = line.split()[0][1:]
                records.setdefault(current_id, [])
            elif current_id is not None and line.strip():
                # Blank lines and lines before the first header belong to no
                # record, so they are dropped rather than written out.
                records[current_id].append(line)

    paths = {}
    for seq_id, data_lines in records.items():
        path = os.path.join(out_dir, seq_id + '.tmp')
        # Write each file once, truncating: appending would mix in stale data
        # left behind by an earlier run in the same directory.
        with open(path, "w") as out_file:
            out_file.writelines(data + "\n" for data in data_lines)
        paths[seq_id] = path
    return paths


def run_rnafold(record_id, sequence, shape_path, extra_params):
    """Fold one sequence with RNAfold using its own SHAPE file.

    Args:
        record_id: Sequence identifier, used as the FASTA header.
        sequence: The sequence to fold.
        shape_path: Path of the SHAPE file for this sequence.
        extra_params: Additional RNAfold arguments, one list item per argument.

    Returns:
        RNAfold's standard output, decoded as UTF-8 and stripped.

    Raises:
        RuntimeError: If RNAfold cannot be started, exits with a non-zero
            status, or writes anything to standard error.
    """
    # Argument list without a shell: ids and options are passed verbatim
    # instead of being re-interpreted (and possibly executed) by /bin/sh.
    cmd = ["RNAfold", "--shape=" + shape_path] + list(extra_params)
    fasta = ">{}\n{}".format(record_id, sequence)
    try:
        p = Popen(cmd, stdin=PIPE, stdout=PIPE, stderr=PIPE)
    except OSError as exc:
        raise RuntimeError(
            "Error in calling RNAfold\n{}\n{}\n".format("", exc))
    out, err = p.communicate(fasta.encode())
    # Any stderr output is still treated as failure, as before; the exit
    # status is checked as well so a silent non-zero exit is not missed.
    if p.returncode != 0 or err:
        raise RuntimeError("Error in calling RNAfold\n{}\n{}\n".format(
            out.decode('utf-8', 'replace'), err.decode('utf-8', 'replace')))
    return out.decode('utf-8').strip()


def main(argv=None, input_file=None):
    """Run RNAfold once per FASTA record, each with its own SHAPE data.

    Args:
        argv: RNAfold options including one ``--shape=<file>``; defaults to
            ``sys.argv[1:]``.
        input_file: Handle providing the FASTA input; defaults to ``sys.stdin``.
    """
    if argv is None:
        argv = sys.argv[1:]
    if input_file is None:
        input_file = sys.stdin

    shape_file, extra_params = split_params(argv)
    shape_paths = write_shape_files(shape_file)

    for record in SeqIO.parse(input_file, "fasta"):
        # A record without SHAPE data keeps the conventional file name, so
        # RNAfold itself reports the missing file.
        shape_path = shape_paths.get(
            record.id, os.path.join(os.curdir, record.id + '.tmp'))
        print(run_rnafold(record.id, record.seq, shape_path, extra_params))


if __name__ == "__main__":
    main()