Mercurial > repos > jay > pdaug_peptide_data_plotting
annotate PDAUG_TSVtoFASTA/PDAUG_TSVtoFASTA.py @ 3:f95354b0619f draft
"planemo upload for repository https://github.com/jaidevjoshi83/pdaug commit edb37634e419f75dd66292e712de51278746d883"
| author | jay | 
|---|---|
| date | Wed, 30 Dec 2020 03:36:51 +0000 | 
| parents | f575cb9c9a67 | 
| children | 1335f334eb13 | 
| rev | line source | 
|---|---|
| 
0
 
9e347250e3a1
"planemo upload for repository https://github.com/jaidevjoshi83/pdaug commit a9bd83f6a1afa6338cb6e4358b63ebff5bed155e"
 
jay 
parents:  
diff
changeset
 | 
1 import os | 
| 
 
9e347250e3a1
"planemo upload for repository https://github.com/jaidevjoshi83/pdaug commit a9bd83f6a1afa6338cb6e4358b63ebff5bed155e"
 
jay 
parents:  
diff
changeset
 | 
2 import argparse | 
| 
 
9e347250e3a1
"planemo upload for repository https://github.com/jaidevjoshi83/pdaug commit a9bd83f6a1afa6338cb6e4358b63ebff5bed155e"
 
jay 
parents:  
diff
changeset
 | 
3 | 
| 
 
9e347250e3a1
"planemo upload for repository https://github.com/jaidevjoshi83/pdaug commit a9bd83f6a1afa6338cb6e4358b63ebff5bed155e"
 
jay 
parents:  
diff
changeset
 | 
4 | 
| 
 
9e347250e3a1
"planemo upload for repository https://github.com/jaidevjoshi83/pdaug commit a9bd83f6a1afa6338cb6e4358b63ebff5bed155e"
 
jay 
parents:  
diff
changeset
 | 
def TSVtoFASTA(InFile, Method, Positive, Negative, OutFile):
    """Convert a tab-separated peptide table into FASTA file(s).

    The first line of ``InFile`` is treated as a header and skipped. The
    first column of every remaining line is written as the sequence; in
    ``'WithClassLabel'`` mode the second column is read as a class label.

    Args:
        InFile: Path of the tab-separated input file.
        Method: ``'WithClassLabel'`` splits the records into two FASTA files
            by class label; ``'NoClassLabel'`` writes every record to
            ``OutFile``. Any other value does nothing.
        Positive: Output path used in ``'WithClassLabel'`` mode for the
            records whose label sorts second among the distinct labels.
        Negative: Output path used in ``'WithClassLabel'`` mode for the
            records whose label sorts first among the distinct labels.
        OutFile: Output path used in ``'NoClassLabel'`` mode.

    Raises:
        ValueError: In ``'WithClassLabel'`` mode, if a data row has no
            second column or fewer than two distinct labels are present.
    """
    if Method == 'WithClassLabel':
        rows = _read_tsv_rows(InFile)

        for fields in rows:
            if len(fields) < 2:
                raise ValueError(
                    "Row without a class label column in " + str(InFile)
                    + ": " + repr(fields[0]))

        # Sort the distinct labels so the label -> output file assignment is
        # the same on every run; plain set iteration order is not stable for
        # strings across interpreter invocations.
        labels = sorted({fields[1] for fields in rows})
        if len(labels) < 2:
            raise ValueError(
                "Expected two distinct class labels in " + str(InFile)
                + ", found " + str(labels))

        print(labels)

        # Only the first two labels (in sorted order) are exported; rows
        # carrying any further label are ignored.
        negative_label, positive_label = labels[0], labels[1]
        positive_count = 0
        negative_count = 0

        with open(Positive, 'w') as positive_out, \
                open(Negative, 'w') as negative_out:
            for fields in rows:
                sequence, label = fields[0], fields[1]
                # Exact comparison: a substring test would file label "10"
                # under label "1" as well.
                if label == positive_label:
                    positive_count += 1
                    positive_out.write('>peptide_' + str(positive_count)
                                       + '_' + str(positive_label) + '\n')
                    positive_out.write(sequence + '\n')
                elif label == negative_label:
                    negative_count += 1
                    negative_out.write('>peptide_' + str(negative_count)
                                       + '_' + str(negative_label) + '\n')
                    negative_out.write(sequence + '\n')

    elif Method == 'NoClassLabel':
        rows = _read_tsv_rows(InFile)

        with open(OutFile, 'w') as fasta_out:
            # Identifiers are zero-based in this mode (kept as-is so existing
            # outputs keep the same record names).
            for index, fields in enumerate(rows):
                fasta_out.write('>peptide_' + str(index) + '\n')
                fasta_out.write(fields[0] + '\n')

    else:
        # Unrecognised methods are deliberately left as a no-op.
        pass


def _read_tsv_rows(path):
    """Return the data rows of ``path`` as lists of tab-separated fields.

    The first line is dropped as a header, trailing CR/LF characters are
    removed from each line, and blank lines are skipped.
    """
    with open(path) as handle:
        lines = handle.readlines()

    rows = []
    for line in lines[1:]:
        line = line.rstrip('\r\n')
        if line.strip():
            rows.append(line.split('\t'))
    return rows
| 
 
9e347250e3a1
"planemo upload for repository https://github.com/jaidevjoshi83/pdaug commit a9bd83f6a1afa6338cb6e4358b63ebff5bed155e"
 
jay 
parents:  
diff
changeset
 | 
50 | 
| 
 
9e347250e3a1
"planemo upload for repository https://github.com/jaidevjoshi83/pdaug commit a9bd83f6a1afa6338cb6e4358b63ebff5bed155e"
 
jay 
parents:  
diff
changeset
 | 
if __name__ == "__main__":

    import argparse

    # Command-line entry point: parse the options and run the conversion.
    parser = argparse.ArgumentParser(
        description="Convert a tab-separated peptide table into FASTA file(s).")

    parser.add_argument("-I", "--InFile", required=True,
                        help="Path to the input .tsv file (first line is a header)")
    parser.add_argument("-P", "--Postvs", required=False, default='FirstDataFile.fasta',
                        help="Output FASTA path for the first class (WithClassLabel mode)")
    parser.add_argument("-N", "--Negtvs", required=False, default='SecondDataFile.fasta',
                        help="Output FASTA path for the second class (WithClassLabel mode)")
    parser.add_argument("-O", "--OutFile", required=False, default='OutFile.fasta',
                        help="Output FASTA path (NoClassLabel mode)")
    # Restrict the method to the two values TSVtoFASTA acts on, so a typo is
    # reported by argparse instead of silently producing no output.
    parser.add_argument("-M", "--Method", required=True,
                        choices=['WithClassLabel', 'NoClassLabel'],
                        help="Conversion mode: WithClassLabel or NoClassLabel")
    args = parser.parse_args()

    TSVtoFASTA(args.InFile, args.Method, args.Postvs, args.Negtvs, args.OutFile)
