Mercurial > repos > davidvanzessen > shm_csr
comparison mutation_column_checker.py @ 81:b6f9a640e098 draft
Uploaded
author | davidvanzessen |
---|---|
date | Fri, 19 Feb 2021 15:10:54 +0000 |
parents | |
children | 729738462297 |
comparison
equal
deleted
inserted
replaced
80:a4617f1d1d89 | 81:b6f9a640e098 |
---|---|
"""Sanity-check the mutation column of a tab-separated mutation table.

Reads "7_V-REGION-mutation-and-AA-change-table.txt" from the current working
directory, locates the "FR3-IMGT" column via the header row, and reports every
data row whose '|'-separated entries in that column are not all accepted by
``mutationMatcher``.
"""
import re

# One mutation entry, as matched by the groups below:
#   1: a nucleotide letter (n/a/c/t/g)      2: one or more digits
#   (any single character)                  3: a nucleotide letter
#   optional ',' and optional space
#   4: optional uppercase letter            5: optional digits
#   optional '>'                            6: optional uppercase letter or ';'
#   7: whatever remains on the line
# Raw string so that "\d" is a regex escape, not an (invalid) string escape.
mutationMatcher = re.compile(r"^([nactg])(\d+).([nactg]),?[ ]?([A-Z])?(\d+)?[>]?([A-Z;])?(.*)?")


def find_unparsable_mutations(column_data):
    """Return the non-empty '|'-separated entries that mutationMatcher rejects.

    An empty list means every entry in ``column_data`` parsed successfully.
    """
    return [
        entry
        for entry in column_data.split("|")
        if entry and mutationMatcher.match(entry) is None
    ]


def check_mutation_column(lines, column_name="FR3-IMGT", progress_every=100000):
    """Validate one column of a tab-separated table, reporting bad rows.

    Args:
        lines: iterable of text lines; the first one is the header row.
        column_name: header label of the column to validate.
        progress_every: positive int; the line index is printed whenever it is
            a multiple of this value (for rows that were not skipped).

    Returns:
        A list holding the first field of every row that contained at least
        one unparsable entry, in file order.

    Raises:
        ValueError: if ``column_name`` does not occur in the header row.
    """
    failed_rows = []
    column_index = -1
    for i, line in enumerate(lines):
        # Drop the line terminator so it can neither hide a header label in the
        # last column nor inflate the length of the last field.
        fields = line.rstrip("\r\n").split("\t")
        if i == 0:
            column_index = fields.index(column_name)
            continue

        # "<=" rather than "<": a row with exactly column_index fields has no
        # element at column_index and would raise IndexError below.
        if len(fields) <= column_index:
            continue

        column_data = fields[column_index]
        # Very short cells are not checked (same threshold as before).
        if len(column_data) > 5 and find_unparsable_mutations(column_data):
            # NOTE(review): fields 0 and 1 look like a row number and a
            # sequence identifier -- confirm against the input format.
            print(fields[1])
            print("Something went wrong at line {line} with:".format(line=fields[0]))
            failed_rows.append(fields[0])

        if i % progress_every == 0:
            print(i)
    return failed_rows


def main():
    """Check the FR3-IMGT column of the mutation table in the working directory."""
    with open("7_V-REGION-mutation-and-AA-change-table.txt", 'r') as file_handle:
        check_mutation_column(file_handle)


if __name__ == "__main__":
    main()