comparison UMI_riboseq_processing/UMI.py @ 1:5d0d5933d370 draft

Uploaded
author triasteran
date Sun, 19 Jun 2022 12:44:06 +0000
parents ef98c6fad2a2
children 6958515efa76
comparison
equal deleted inserted replaced
0:ef98c6fad2a2 1:5d0d5933d370
17 for lines in grouper(f, chunk_size, ""): #for every chunk_sized chunk 17 for lines in grouper(f, chunk_size, ""): #for every chunk_sized chunk
18 header = lines[0] 18 header = lines[0]
19 seq = lines[1] 19 seq = lines[1]
20 sep = lines[2] 20 sep = lines[2]
21 qual = lines[3] 21 qual = lines[3]
22 trimmed_seq = seq[2:-11]+seq[-6:-1]+"\n" # fooprint + barcode 22 trimmed_seq = seq[2:-5]+"\n" # fooprint + barcode
23 UMI = seq[0:2]+seq[-11:-6] #7nt in total 23 UMI = seq[0:2]+seq[-5:] #7nt in total; 5'NN and last 3'NNNNN
24 split_header = header.split(" ") 24 split_header = header.split(" ")
25 new_header = split_header[0]+"_"+UMI+" "+split_header[1] 25 new_header = split_header[0]+"_"+UMI+" "+split_header[1]
26 if qual[-1:] == "\n": 26 if qual[-1:] == "\n":
27 new_qual = qual[2:-11]+qual[-6:-1]+"\n" 27 new_qual = qual[2:-5]+"\n"
28 else: 28 else:
29 new_qual = qual[2:-10]+qual[-6:-1] 29 new_qual = qual[2:-5]
30 output.write(new_header) 30 output.write(new_header)
31 output.write(trimmed_seq) 31 output.write(trimmed_seq)
32 output.write(sep) 32 output.write(sep)
33 output.write(new_qual) 33 output.write(new_qual)
34 34