annotate calc_fitness.py @ 2:ad553834b0ea draft

Uploaded
author kaymccoy
date Sun, 06 Nov 2016 21:06:52 -0500
parents
children
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
2
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
1 # A translation of calc_fitness.pl into python! For analysis of Tn-Seq.
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
2 # This script requires BioPython, which in turn has a good number of dependencies (some optional but very helpful).
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
3 # How to install BioPython and a list of its dependencies can be found here: http://biopython.org/DIST/docs/install/Installation.html
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
4 # K. McCoy
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
5
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
6
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
7
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
8
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
9
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
10
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
11
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
12
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
13
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
14 ##### ARGUMENTS #####
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
15
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
def print_usage():
    """Print the command-line flags accepted by calc_fitness to stdout.

    Called when one of the required flags (-ref, -t1, -t2, -out) is missing.
    Takes no arguments and returns None.

    The two time points are called "time 1" and "time 2" throughout, matching
    the -t1 / -t2 flags, and -ef / -el are described as fractions because the
    script multiplies the gene length by the raw value (0.1 means 10%).
    """
    bold = "\033[1m"   # ANSI escape sequence: switch bold on
    plain = "\033[0m"  # ANSI escape sequence: reset text attributes

    usage_lines = [
        "\n" + "You are missing one or more required flags. A complete list of flags accepted by calc_fitness is as follows:" + "\n\n",
        bold + "Required" + plain + "\n",
        "-ref" + "\t\t" + "The name of the reference genome file, in GenBank format." + "\n",
        "-t1" + "\t\t" + "The name of the bowtie mapfile from time 1." + "\n",
        "-t2" + "\t\t" + "The name of the bowtie mapfile from time 2." + "\n",
        "-out" + "\t\t" + "Name of a file to enter the .csv output." + "\n",
        "\n",
        bold + "Optional" + plain + "\n",
        "-expansion" + "\t\t" + "Expansion factor (default: 250)" + "\n",
        "-reads1" + "\t\t" + "The number of reads to be used to calculate the correction factor for time 1." + "\n\t\t" + "(default counted from bowtie output)" + "\n",
        "-reads2" + "\t\t" + "The number of reads to be used to calculate the correction factor for time 2." + "\n\t\t" + "(default counted from bowtie output)" + "\n",
        "-cutoff" + "\t\t" + "Discard any positions where the average of counted transcripts at time 1 and time 2 is below this number (default 0)" + "\n",
        "-cutoff2" + "\t\t" + "Discard any positions within the normalization genes where the average of counted transcripts at time 1 and time 2 is below this number (default 10)" + "\n",
        "-strand" + "\t\t" + "Use only the specified strand (+ or -) when counting transcripts (default: both)" + "\n",
        "-normalize" + "\t" + "A file that contains a list of genes that should have a fitness of 1 - used for normalization and bottleneck calculations." + "\n",
        "-b" + "\t" + "Calculate bottleneck value from all genes (rather than only normalization genes)" + "\n",
        "-maxweight" + "\t" + "The maximum weight a transposon gene can have in normalization calculations" + "\n",
        "-multiply" + "\t" + "Multiply all fitness scores by a certain value (e.g., the fitness of a knockout). You should normalize the data." + "\n",
        "-ef" + "\t\t" + "Exclude insertions that occur in the first N fraction of each gene (e.g. 0.1 = first 10%)--because they may not affect gene function." + "\n",
        "-el" + "\t\t" + "Exclude insertions in the last N fraction of each gene (e.g. 0.1 = last 10%)--considering truncation may not affect gene function." + "\n",
        "-wig" + "\t\t" + "Create a wiggle file for viewing in a genome browser. Provide a filename." + "\n",
        "-uncol" + "\t\t" + "Use if reads were uncollapsed when mapped." + "\n",
        "\n",
    ]

    # One print call per entry, so every entry is followed by an extra newline.
    for usage_line in usage_lines:
        print(usage_line)
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
40
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
41 import argparse
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
# Every flag stores the string it is given under the destination name paired
# with it below; flags that are not supplied are left as None by argparse.
parser = argparse.ArgumentParser()
for flag, destination in (
    ("-ref", "ref_genome"),
    ("-t1", "mapfile1"),
    ("-t2", "mapfile2"),
    ("-out", "outfile"),
    ("-out2", "outfile2"),
    ("-expansion", "expansion_factor"),
    ("-reads1", "reads1"),
    ("-reads2", "reads2"),
    ("-cutoff", "cutoff"),
    ("-cutoff2", "cutoff2"),
    ("-strand", "usestrand"),
    ("-normalize", "normalize"),
    ("-b", "bottleall"),
    ("-maxweight", "max_weight"),
    ("-multiply", "multiply"),
    ("-ef", "exclude_first"),
    ("-el", "exclude_last"),
    ("-wig", "wig"),
    ("-uncol", "uncol"),
):
    parser.add_argument(flag, action="store", dest=destination)
arguments = parser.parse_args()

# The reference genome, both mapfiles and the output file are mandatory:
# without all four, show the flag list and stop.
if not (arguments.ref_genome and arguments.mapfile1 and arguments.mapfile2 and arguments.outfile):
    print_usage()
    quit()

# Defaults for optional values that were not supplied (or were supplied empty):
#   expansion_factor  250   a trivial placeholder number
#   max_weight        75    similarly trivial
#   cutoff            0     exists to discard positions with a low number of counted
#                           transcripts, because fitnesses calculated from them may
#                           not be very accurate (the same reasoning by which studies
#                           with low sample sizes are inaccurate)
#   cutoff2           10    the same idea, restricted to positions within the
#                           normalization genes; it only has an effect if it is larger
#                           than cutoff, since the normalization step references a
#                           list of insertions already affected by cutoff
#   usestrand         both  count reads from both strands
for option, fallback in (
    ("expansion_factor", 250),
    ("max_weight", 75),
    ("cutoff", 0),
    ("cutoff2", 10),
    ("usestrand", "both"),
):
    if not getattr(arguments, option):
        setattr(arguments, option, fallback)
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
91
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
92
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
93
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
94
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
95
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
96
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
97 ##### PARSING THE REFERENCE GENOME #####
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
98
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
def get_time():
    """Return the current local time of day as a ``datetime.time`` object."""
    from datetime import datetime as clock
    return clock.now().time()


# Progress banner with the time at which the run began.
print("\n" + "Starting: " + str(get_time()) + "\n")
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
103
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
104 from Bio import SeqIO
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
105 import os.path
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
# Read the GenBank reference.  The loop overwrites refname/features on every
# record, so for a multi-record file only the LAST record is kept.
# The with-statement closes the file even if parsing raises.
with open(arguments.ref_genome, "rU") as handle:
    for record in SeqIO.parse(handle, "genbank"):
        refname = record.id
        features = record.features

# Makes a dictionary out of each feature that's a gene - with its gene name, start location,
# end location, and strand as keys to their values. Then makes a list out of all those
# dictionaries for ease of accessing later on.

feature_list = []
for feature in features:
    if feature.type != "gene":
        continue
    gene = feature.qualifiers["locus_tag"]
    strand = feature.location.strand
    start = float(feature.location.start)
    end = float(feature.location.end)

    # exclude_first and exclude_last trim a fraction off the start and end of every gene;
    # e.g. a value of 0.1 for exclude_last excludes the last 10% of all genes.  This can be
    # useful because insertions at the very start or end of a gene often don't break its function.
    #
    # Both trims are measured against the full, untrimmed gene span.  (Previously exclude_last
    # was computed after start had already been moved, so with both flags set the tail trim
    # was a fraction of the already-shortened gene rather than of the whole gene.)
    #
    # NOTE(review): trimming ignores strand - "first" is always applied at the lower coordinate
    # and "last" at the higher one, including for minus-strand genes.  Confirm this is intended.
    gene_span = end - start
    if arguments.exclude_first:
        start += gene_span * float(arguments.exclude_first)
    if arguments.exclude_last:
        end -= gene_span * float(arguments.exclude_last)

    feature_dictionary = {"gene": gene, "start": start, "end": end, "strand": strand}
    feature_list.append(feature_dictionary)

print("Done generating feature lookup: " + str(get_time()) + "\n")
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
133
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
134
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
135
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
136
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
137
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
138
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
139
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
140
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
141
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
142
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
143 ##### PARSING THE MAPFILES #####
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
144
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
# Load every line of the two bowtie mapfiles into memory: r1 holds the lines of the
# -t1 mapfile and r2 the lines of the -t2 mapfile.  The handles get their own names
# instead of rebinding the builtin name `file`.
with open(arguments.mapfile1) as mapfile_t1:
    r1 = mapfile_t1.readlines()
with open(arguments.mapfile2) as mapfile_t2:
    r2 = mapfile_t2.readlines()
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
149
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
150 # When called, goes through each line of the mapfile to find the strand (+/Watson or -/Crick), count, and position of the read. It may be helpful to look at how the mapfiles are formatted to understand how this code finds them.
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
151
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
def read_mapfile(reads):
    """Tally insertion read counts per position and strand for one mapfile.

    Reads two settings from the module-level ``arguments`` namespace:
    ``arguments.uncol`` (truthy selects the uncollapsed line layout) and
    ``arguments.usestrand`` ("both", or a strand symbol to keep only lines
    on that strand).

    Args:
        reads: iterable of mapfile lines (strings).

    Returns:
        A tuple ``(plus_counts, minus_counts)``.  Each is a dict mapping an
        insertion position (float) to the summed count at that position, plus
        two bookkeeping keys: "total" (sum of all counts on that strand) and
        "sites" (number of distinct positions seen on that strand).  Lines
        whose strand field is anything other than "+" are tallied as minus.

    Raises:
        IndexError / ValueError: if a non-blank line has fewer fields than the
            selected layout needs, or a count/position field is not numeric.
    """
    plus_counts = {"total": 0, "sites": 0}
    minus_counts = {"total": 0, "sites": 0}

    for read in reads:
        fields = read.split()
        if not fields:
            # Blank line: nothing to parse.
            continue

        if arguments.uncol:
            # Uncollapsed layout: every line is a single read; strand, position and
            # sequence are whitespace-separated fields 2, 4 and 5.
            strand = fields[2]
            count = 1
            position = float(fields[4])
            sequence_index = 5
        else:
            # Collapsed layout: the first field looks like "<id>-<count>"; lines whose
            # first field contains no "-" are skipped.
            if "-" not in fields[0]:
                continue
            strand = fields[1]
            count = float(fields[0].split("-")[1])
            position = float(fields[3])
            sequence_index = 4

        # If for some reason you want to skip all reads from one of the strands - for
        # example, to compare the two strands - that's done here.
        if arguments.usestrand != "both" and strand != arguments.usestrand:
            continue

        if strand == "+":
            # The -2 comes from a fake "TA" in the read; see how the libraries are
            # constructed for more on this.  The sequence field is only looked at for
            # plus-strand reads.
            position += len(fields[sequence_index]) - 2
            counts = plus_counts
        else:
            counts = minus_counts

        counts["total"] += count
        if position in counts:
            counts[position] += count
        else:
            # First read seen at this position: it is a new site.
            counts[position] = count
            counts["sites"] += 1

    return (plus_counts, minus_counts)
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
215
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
216 # Calls read_mapfile(reads) on r1 and r2, the lines read from the t1 and t2 mapfiles (arguments.mapfile1 and arguments.mapfile2).
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
217
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
218
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
219
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
220
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
221
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
# Tally the t1 mapfile lines, then the t2 mapfile lines, reporting the time after each.
(plus_ref_1, minus_ref_1) = read_mapfile(r1)
print("Read first file: " + str(get_time()) + "\n")
(plus_ref_2, minus_ref_2) = read_mapfile(r2)
print("Read second file: " + str(get_time()) + "\n")

# The lines below are just printed for reference: for each time point, the "total"
# and then the "sites" entry of the plus-strand and minus-strand dictionaries.
for summary_heading, summary_key in (("Reads:", "total"), ("Sites:", "sites")):
    print(summary_heading + "\n")
    print("1: + " + str(plus_ref_1[summary_key]) + " - " + str(minus_ref_1[summary_key]) + "\n")
    print("2: + " + str(plus_ref_2[summary_key]) + " - " + str(minus_ref_2[summary_key]) + "\n")
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
235
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
236
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
237
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
238
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
239
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
240
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
241
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
242
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
243
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
244
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
245 ##### FITNESS CALCULATIONS #####
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
246
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
247 # If reads1 and reads2 weren't specified in the command line, sets them as the total number of reads (found in read_mapfile())
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
248
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
# When -reads1 / -reads2 were not given, fall back to the read totals counted by
# read_mapfile() (plus strand + minus strand) for that time point.
arguments.reads1 = arguments.reads1 or (plus_ref_1["total"] + minus_ref_1["total"])
arguments.reads2 = arguments.reads2 or (plus_ref_2["total"] + minus_ref_2["total"])

# Correction factors: each time point's read count divided by `total`, the average
# of the two read counts.  They are used later on to correct for pipetting errors,
# or any other error that would cause unequal amounts of DNA from t1 and t2 to be
# sequenced so that an unequal number of reads is produced.
reads_t1 = float(arguments.reads1)
reads_t2 = float(arguments.reads2)
total = (reads_t1 + reads_t2) / 2
cfactor1 = reads_t1 / total
cfactor2 = reads_t2 / total
print("Cfactor 1: " + str(cfactor1) + "\n")
print("Cfactor 2: " + str(cfactor2) + "\n")
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
262 import math
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
263 import csv
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
# Header row of the results table; one row per insertion is built further down.
results = [["position", "strand", "count_1", "count_2", "ratio", "mt_freq_t1", "mt_freq_t2", "pop_freq_t1", "pop_freq_t2", "gene", "D", "W", "nW"]]

# Running counters: insertions that fall inside a gene, and insertions overall.
genic = 0
total_inserts = 0

# The genome length is taken from the third whitespace-separated field of the first
# line of the reference file (presumably the GenBank LOCUS line - verify for files
# whose first line is laid out differently).  It is kept as a string here.
# The handle gets its own name instead of rebinding the builtin name `file`.
with open(arguments.ref_genome, "r") as genbank_handle:
    firstline = genbank_handle.readline()
genomelength = firstline.split()[2]

# Genome position examined by the loop that follows.
i = 0
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
271 while i < float(genomelength):
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
272
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
273 # At each possible location for an insertion in the genome, counts the number of actual insertions at t1 and which strand(s) the corresponding reads came from.
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
274
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
275 c1 = 0
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
276 if i in plus_ref_1:
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
277 c1 = float(plus_ref_1[i])
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
278 strand = "+/"
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
279 if i in minus_ref_1:
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
280 c1 += float(minus_ref_1[i])
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
281 strand = "b/"
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
282 elif i in minus_ref_1:
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
283 c1 = float(minus_ref_1[i])
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
284 strand = "-/"
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
285
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
286 # If there were no insertions at a certain location at t1 just continues to the next location; there can't be any comparison to make between t1 and t2 if there are no t1 insertions!
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
287
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
288 else:
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
289 i += 1
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
290 continue
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
291
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
292 # At each location where there was an insertion at t1, counts the number of insertions at t2 and which strand(s) the corresponding reads came from.
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
293
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
294 c2 = 0
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
295 if i in plus_ref_2:
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
296 c2 = float(plus_ref_2[i])
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
297 if i in minus_ref_2:
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
298 c2 += float(minus_ref_2[i])
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
299 strand += "b"
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
300 else:
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
301 strand += "+"
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
302 elif i in minus_ref_2:
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
303 c2 = float(minus_ref_2[i])
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
304 strand += "-"
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
305
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
306 # Corrects with cfactor1 and cfactor2
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
307
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
308 c1 /= cfactor1
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
309 if c2 != 0:
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
310 c2 /= cfactor2
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
311 ratio = c2/c1
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
312 else:
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
313 c2 = 0
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
314 ratio = 0
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
315
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
316 # Passes by all insertions with a number of reads smaller than the cutoff, as they may lead to inaccurate fitness calculations.
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
317
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
318 if (c1 + c2)/2 < float(arguments.cutoff):
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
319 i+= 1
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
320 continue
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
321
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
322 # Calculates each insertion's frequency within the populations at t1 and t2.
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
323
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
324 mt_freq_t1 = c1/total
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
325 mt_freq_t2 = c2/total
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
326 pop_freq_t1 = 1 - mt_freq_t1
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
327 pop_freq_t2 = 1 - mt_freq_t2
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
328
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
329 # Calculates each insertion's fitness! This is from the fitness equation log((frequency of mutation @ time 2 / frequency of mutation @ time 1)*expansion factor)/log((frequency of population without the mutation @ time 2 / frequency of population without the mutation @ time 1)*expansion factor)
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
330
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
331 w = 0
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
332 if mt_freq_t2 != 0:
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
333 top_w = math.log(mt_freq_t2*(float(arguments.expansion_factor)/mt_freq_t1))
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
334 bot_w = math.log(pop_freq_t2*(float(arguments.expansion_factor)/pop_freq_t1))
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
335 w = top_w/bot_w
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
336
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
337 # Checks which gene locus the insertion falls within, and records that.
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
338
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
339 gene = ''
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
340 for feature_dictionary in feature_list:
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
341 if feature_dictionary["start"] <= i and feature_dictionary["end"] >= i:
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
342 gene = "".join(feature_dictionary["gene"])
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
343 genic += 1
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
344 break
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
345 total_inserts += 1
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
346
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
347 # Writes all relevant information on each insertion and its fitness to a csv file: the location of the insertion, its strand, c1, c2, etc. (the variable names are self-explanatory)
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
348 # w is written twice, because the second w will be normalized if normalization is called for, thus becoming nW.
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
349
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
350 row = [i, strand, c1, c2, ratio, mt_freq_t1, mt_freq_t2, pop_freq_t1, pop_freq_t2, gene, arguments.expansion_factor, w, w]
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
351 results.append(row)
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
352 i += 1
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
353 with open(arguments.outfile, "wb") as csvfile:
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
354 writer = csv.writer(csvfile)
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
355 writer.writerows(results)
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
356
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
357 print "Done comparing mapfiles " + str(get_time()) + "\n"
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
358 print "Genic: " + str(genic) + "\n"
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
359 print "Total: " + str(total_inserts) + "\n"
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
360
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
361
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
362
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
363
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
364
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
365
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
366
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
367
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
368
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
369
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
370 ##### BOTTLENECK VALUE CALCULATION #####
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
371
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
372 #the bottleneck value is calculated here if done from all genes - otherwise it's done in the normalization section if only taken from normalization genes
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
373
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
# Bottleneck value taken over ALL insertions: the fraction of recorded insertions
# whose fitness (column 11, W) is exactly 0, written to outfile2 together with
# the read total and the reference name.
if arguments.bottleall:
    # The normalization section skips a row whose W column holds the literal 'W',
    # i.e. results carries a header row. Leave it out here so it does not inflate
    # the denominator. NOTE(review): confirm results is built with that header row.
    insertion_rows = [row for row in results if row[11] != 'W']

    # overall_blank_count is expected to be initialised earlier in the script.
    for row in insertion_rows:
        if row[11] == 0:
            overall_blank_count += 1
    overall_original_count = len(insertion_rows)

    # Guard against an empty result set instead of dividing by zero.
    if overall_original_count:
        pc_blank_normals = float(overall_blank_count) / float(overall_original_count)
    else:
        pc_blank_normals = 0.0

    with open(arguments.outfile2, "w") as f:
        f.write("bottleneck_value: " + str(pc_blank_normals) + "\n" + "total: " + str(total) + "\n" + "refname: " + refname)
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
384
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
385
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
386
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
387
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
388
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
389
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
390
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
391
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
392
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
393
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
394 ##### NORMALIZATION #####
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
395
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
# When a WIG output file was requested, start the text that will eventually be
# written to it with the two standard header lines: a track definition line and a
# variableStep declaration naming the reference. (UCSC documents the WIG format.)
# Per-insertion data lines are appended to wigstring further down.

if arguments.wig:
    wig_header_lines = [
        "track type=wiggle_0 name=" + arguments.wig,
        "variableStep chrom=" + refname,
    ]
    wigstring = "\n".join(wig_header_lines) + "\n"
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
401
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
402 # Takes normalization genes (which should all be predicted or known to have fitness values of exactly 1.0, like transposons for example) and uses them to normalize the fitnesses of all insertion locations
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
403
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
404 if (arguments.normalize):
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
405 with open(arguments.normalize) as file:
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
406 transposon_genes = file.read().splitlines()
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
407 print "Normalize genes loaded" + "\n"
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
408 blank_ws = 0
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
409 sum = 0
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
410 count = 0
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
411 weights = []
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
412 scores = []
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
413 for list in results:
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
414 if list[9] != '' and list[9] in transposon_genes:
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
415 c1 = list[2]
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
416 c2 = list[3]
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
417 score = list[11]
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
418 avg = (c1 + c2)/2
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
419
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
420 # Skips over those insertion locations with too few insertions - their fitness values are less accurate because they're based on such small insertion numbers.
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
421
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
422 if float(c1) >= float(arguments.cutoff2):
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
423
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
424 # Sets a max weight, to prevent insertion location scores with huge weights from unbalancing the normalization.
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
425
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
426 if (avg >= float(arguments.max_weight)):
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
427 avg = float(arguments.max_weight)
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
428
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
429 # Tallies how many w values are 0 within the blank_ws value; you might get many transposon genes with a w value of 0 if a bottleneck occurs, for example, which is especially common with in vivo experiments. This is used later by aggregate.py
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
430 # For example, when studying a nasal infection in a mouse model, what bacteria "sticks" and is able to survive and what bacteria is swallowed and killed or otherwise flushed out tends to be a matter of chance not fitness; all mutants with an insertion in a specific transposon gene could be flushed out by chance!
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
431
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
432 if score == 0:
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
433 blank_ws += 1
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
434
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
435 sum += score
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
436 count += 1
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
437 weights.append(avg)
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
438 scores.append(score)
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
439
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
440 print str(list[9]) + " " + str(score) + " " + str(c1)
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
441
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
442 # Counts and removes all "blank" fitness values of normalization genes - those that = 0 - because they most likely don't really have a fitness value of 0, and you just happened to not get any reads from that location at t2.
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
443
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
444 blank_count = 0
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
445 original_count = len(scores)
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
446 curr_count = original_count
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
447 i = 0
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
448 while i < curr_count:
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
449 w_value = scores[i]
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
450 if w_value == 0:
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
451 blank_count += 1
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
452 weights.pop(i)
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
453 scores.pop(i)
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
454 i -= 1
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
455 curr_count = len(scores)
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
456 i += 1
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
457
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
458 # If no normalization genes can pass the cutoff, normalization cannot occur, so this ends the script advises the user to try again and lower cutoff and/or cutoff2.
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
459
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
460 if len(scores) == 0:
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
461 print 'ERROR: The normalization genes do not have enough reads to pass cutoff and/or cutoff2; please lower one or both of those arguments.' + "\n"
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
462 quit()
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
463
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
464 pc_blank_normals = float(blank_countv) / float(original_count)
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
465 print "# blank out of " + str(original_count) + ": " + str(pc_blank_normals) + "\n"
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
466 if (!arguments.bottleall):
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
467 with open(arguments.outfile2, "w") as f:
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
468 f.write("bottleneck_value: " + str(pc_blank_normals) + "\n" + "total: " + str(total) + "\n" + "refname: " + refname)
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
469
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
470 average = sum / count
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
471 i = 0
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
472 weighted_sum = 0
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
473 weight_sum = 0
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
474 while i < len(weights):
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
475 weighted_sum += weights[i]*scores[i]
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
476 weight_sum += weights[i]
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
477 i += 1
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
478 weighted_average = weighted_sum/weight_sum
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
479
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
480 print "Normalization step:" + "\n"
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
481 print "Regular average: " + str(average) + "\n"
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
482 print "Weighted Average: " + str(weighted_average) + "\n"
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
483 print "Total Insertions: " + str(count) + "\n"
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
484
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
485 old_ws = 0
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
486 new_ws = 0
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
487 wcount = 0
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
488
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
489 for list in results:
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
490 if list[11] == 'W':
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
491 continue
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
492 new_w = float(list[11])/weighted_average
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
493
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
494 # Sometimes you want to multiply all the fitness values by a constant; this does that.
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
495 # For example you might multiply all the values by a constant for a genetic interaction screen - where Tn-Seq is performed as usual except there's one background knockout all the mutants share.
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
496
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
497 if arguments.multiply:
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
498 new_w *= float(arguments.multiply)
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
499
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
500 if float(list[11]) > 0:
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
501 old_ws += float(list[11])
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
502 new_ws += new_w
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
503 wcount += 1
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
504
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
505 list[12] = new_w
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
506
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
507 if (arguments.wig):
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
508 wigstring += str(list[0]) + " " + str(new_w) + "\n"
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
509
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
510 old_w_mean = old_ws / wcount
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
511 new_w_mean = new_ws / wcount
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
512 print "Old W Average: " + str(old_w_mean) + "\n"
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
513 print "New W Average: " + str(new_w_mean) + "\n"
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
514
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
515 with open(arguments.outfile, "wb") as csvfile:
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
516 writer = csv.writer(csvfile)
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
517 writer.writerows(results)
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
518
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
# Write the WIG file, if one was requested. With normalization the data lines
# were already appended to wigstring in the normalization section; without it,
# each insertion's un-normalized W (column 11) is appended here first.
if arguments.wig:
    if not arguments.normalize:
        wig_lines = []
        for row in results:
            # Skip the header row (its W column holds the literal 'W'), exactly
            # as the normalization loop does, so it is not emitted as a data line.
            if row[11] == 'W':
                continue
            wig_lines.append(str(row[0]) + " " + str(row[11]) + "\n")
        wigstring += "".join(wig_lines)
    with open(arguments.wig, "wb") as wigfile:
        wigfile.write(wigstring)
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
528
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
529
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
530
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
531
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
532
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
533
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
534
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
535
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
536
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
537
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
538
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
539
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
540
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
541
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
542
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
543
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
544
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
545
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
546
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
547
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
548
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
549
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
550
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
551
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
552
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
553
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
554
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
555
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
556
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
557
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
558
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
559
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
560
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
561
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
562
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
563
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
564
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
565
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
566
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
567
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
568
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
569
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
570
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
571
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
572
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
573
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
574
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
575
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
576
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
577
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
578
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
579
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
580
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
581
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
582
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
583
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
584
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
585
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
586
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
587
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
588
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
589
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
590
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
591
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
592
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
593
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
594
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
595
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
596
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
597
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
598
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
599
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
600
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
601
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
602
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
603
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
604
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
605
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
606
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
607
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
608
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
609
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
610
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
611
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
612
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
613
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
614
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
615
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
616
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
617
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
618
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
619
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
620
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
621
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
622
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
623
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
624
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
625
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
626
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
627
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
628
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
629 # `````````````
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
630 # `````````````
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
631 # ``@@@@@@@@@``
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
632 # ``@@@@@@@@@```
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
633 # ``@@@@@@@@@``
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
634 # ``@@@@@@@@@``
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
635 # ``@@@@@@@@@``
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
636 # ``@@@@@@@@@``
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
637 # ```@@@@@@@@#``
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
638 # ```@@@@@@@@#``
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
639 # ```@@@@@@@@+``
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
640 # ```@@@@@@@@'``
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
641 # ```@@@@@@@@;``
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
642 # ```@@@@@@@@;``
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
643 # ```@@@@@@@@:``
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
644 # ```@@@@@@@@,``
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
645 # ``.@@@@@@@@.``
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
646 # ``.@@@@@@@@```
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
647 # ``.@@@@@@@@```
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
648 # ``.@@@@@@@@```
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
649 # ``.@@@@@@@@``
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
650 # ``,@@@@@@@@``
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
651 # ``,@@@@@@@@``
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
652 # ``.@@@@@@@@``
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
653 # ```@@@@@@@@``
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
654 # ``:@@@@@@@@``
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
655 # ``:@@@@@@@@``
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
656 # ``:@@@@@@@@``
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
657 # ``:@@@@@@@@``
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
658 # ``'@@@@@@@@``
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
659 # ``;@@@@@@@@``
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
660 # ``:@@@@@@@@``
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
661 # ``:@@@@@@@@``
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
662 # ``:@@@@@@@@``
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
663 # ``;@@@@@@@#``
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
664 # ````+@@@@@@@#`````
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
665 # ```````#@@@@@@@#``````
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
666 # `````.,@@@@@@@@@...````
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
667 # ``@@@@@@@@@@@@@@@@@@;``
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
668 # ``@@@@@@@@@@@@@@@@@@;``
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
669 # ```````````````````````
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
670 # `````````````````````
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
671 # ``````.```````
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
672 # ````@.''```
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
673 # ```# `;```
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
674 # ``.+ @```
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
675 # ```@ ````,+```
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
676 # ```;;````` @```
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
677 # ```@ ``````,@```
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
678 # ```,+```..```@```
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
679 # ```@ ``....```@```
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
680 # ```+' ``....```#'``
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
681 # ```@```......`` @```
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
682 # ```'+```......```'@```
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
683 # ```@ ``........```@```
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
684 # ```'#```........````@```
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
685 # ```@ ``..........```#,``
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
686 # ```'#```...........`` @```
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
687 # ```@``.............```.+```
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
688 # ```:#```.............`` #```
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
689 # ``````` ```@ ```.......#......``.@```
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
690 # `````````` ```:@```#`......@......```@```
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
691 # ``````#@@@`` ```@ `.`:.......@.......`` @```
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
692 # ```.#@###@`` ```:@``..`+`....`@.......```@,``
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
693 # ```'@####@``` ```@````..@@@@@@@@#,`..#```` @```
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
694 # ```#####@@``` ``;@ ,`.,@@. `@@..#..```''``
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
695 # ``:####@#```` ```@``@`@@ @@:...`` @```
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
696 # ```@#####```` ``,@``.@, ,@`...``:@```
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
697 # ``.####@``` ```@.` @` @....``@```
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
698 # ``####@``` ``,@ @.` @`.````@```
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
699 # ``@##@```` ```@, @: ;# `@..```@.``
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
700 # ```@##```` ``.@`,@ @@, #...`` @```
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
701 # ```@#@``` ```@, # `@@@ @`.```;'``
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
702 # ```##:`` ``.@ +, .@@@ ,'..`` @```
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
703 # ``.##``` ```@, @ `@@@ @`.```,+```
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
704 # `````@##``` ```@`'. @@@ :...```@``` ``````````
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
705 # ````````````````````````````````````````##@``` ```@:`@ @@@ #...`` #``` `````````````````
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
706 # ```````````````````````````````````````.###@``` ```@ `, .@@@++'++#@@'` #`..```#``` ````````````'@@@@@.````
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
707 # `````+@####################@@@@@@@@@@@@#####@``` ```#;`,. `@#...,.,,,,,,..;@, @....`` @``````````````+@@@########@.``
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
708 # `+@##########################################,```` ```````````````@```@ +@,.,,,,,,,,,,,,,,,,,@ @....```#`````````'@@@##############@```
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
709 # `@###########################################@``````````````````````````````````````+'``.,'.#.,,,,,,,,,,,,,,,,,,,,.++@......`` @````+@@@#######@+``````'###'``
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
710 # ``:@@########@@@@@@@@@@@@@@@@@@@@@@#@@@@@@@##@``````````````````````````......,`,,.,@ ```.##.,.,,,,,,,,,,,,,,,,,,,,.##......`` :.+@@#######@@:``````````###@```
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
711 # ````````````````````````````````,#########@###@@@@#################################@'```...@.,,,,,,,,,,,,,,,,,,,,,,,#.........`'@######@@+```````````````@##```
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
712 # ```````````````````````````````@#########@#########################################```.....@:,,,,,,,,,,,,,,,,,,..;@..........`@####@@:```````` ```@##@``
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
713 # `````@@####@@@##########@@@@@@@@@@@@@@@@@@@@@@@@@@@@#+@+```......@#.,,,,,,,,,,,,,,,,.##..........`` #@#````````` ```##@```
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
714 # ``.#@######@####:```````````````````````````````````@ ``.......@:#,,,,,,,,,,,,,,,;@@`............`` @`````` ```@##:``
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
715 # ``:########@###@```````````````````````````````````#;```......+..`##,.,,,,,,,,.#@#..'............`` @```` ``;##@```
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
716 # ```@@####@@##@'```` ````@ ``.......'.....@@#+;:;'#@@;`...#`............`` @``` ```@##```
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
717 # ```````````````` ```@,```.............'..:''':.@`......:............```@.`` ``@###```
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
718 # `````````````` ``.@```..............#........'`....................```@``` ``.##@``````
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
719 # ```@.``..............`#........,.....................```@.`` ```@#+,``````
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
720 # ``.@``.,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,.................```@``` ````+#####@````
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
721 # ```@````......,........................,....,,.,.,,,,,..` @,`` ```;@@######````
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
722 # ``.@```.......,......................`......,...........```@``` ```+#########@````
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
723 # ```@```...........`@@+...............+@@`....,...........```@:`` ``;@#########@'```
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
724 # ``.@ ``............@@@@@`.........,@@@@@.....,............```@``` ``@#########@#@@```
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
725 # ```@.```............@@@@@@@`.....'@@@@@@@.....,............```#'`` ``@###@###@#@#@@@``
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
726 # ``.@```.............@@@@@@@@@..+#@@@@@@@@.....,.............`` #``` ``@#@@@@##@#@#@@@``
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
727 # ```@````.............@@@@@@@@@@@@@@@@@@@@@.....,.............```'#``` ``'#@@@@##@#@@@@@,`
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
728 # ``.@ ``.........,....@@@@@@@@@',##@@@@@@@@`....,..............```@``` ```@@@@@##@@'#@@@@`
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
729 # ```@.```.........,....@@@@@@@#`...`#@@@@@@@`....,..............```.@``` ``#@@@@##;```@@@@`
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
730 # ``.@ ``.....,,,,,,,.,.@@@@@#.,,,,,,,.#@@@@@,,,,,,,,,,,,:,,,,,,,,.``@``` ``#@@@@#.````@@@@`
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
731 # ```@. ``...............@@@;......,......#@@@`...........,.........```@``` ``#@@@;``````@@@@`
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
732 # ```@```................@,........,........+#`...........,.........```@.`` ``#@@@;``````@@@@`
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
733 # ```@.``...........................,.........`............,..........```@``` ``#@@@'`` ``#@@;`
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
734 # ``.@ ``................,..........,......................,..........```#:`` ``#@@@'`` ```#@``
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
735 # ```@,``............................,......................,...........`` @``` ``+@@@'`` `````
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
736 # ``.@```............................,......................,...........```#+`` ``;@@@+`` ``
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
737 # ```@,``.............................,......................,............```@``` ``'@@@+``
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
738 # ``.@```.........,...................,......................,............```'#``` ``;@@@+``
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
739 # ```@:```.........,...................,......................,.............`` @``` ``:@@@+``
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
740 # ```@`..,,,,,,,,,,,,,,,,,,..,.........,......................,.............```'@``` ``;@@@#``
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
741 # ``+'```...,.................,....,,,,,,,,,,,,,,,,,,,,,,,,,,,,,..........,...``@``` ``;@@@#``
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
742 # ```@ ``....,.................,.......................................,.......``;@``` ``:@@@#``
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
743 # ``'#```....,.................,.......................................,.......```@``` ``:@@@@``
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
744 # ```@```.....,.................,.......................................,........``;#`` ``:@@@@``
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
745 # ```@ ``.....,.................,.......................................,........`` @``` ``:@@@@``
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
746 # ``@````...............................................................,........`` @.`` ``;@@@@``
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
747 # ``@ ```..............................................................,........`` .#`` ``'@@@@``
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
748 # ``# ``````.`.```````````````..````````````````````..`````````````````.`````````` @`` ``'@@@@``
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
749 # ``. `````````````````````````````````````````````````````````````````````````` .;`` ``'@@@@``
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
750 # ``@;` `` ` ` ` ` ```` ` ````` ` ` `,+@``` ``+@@@@``
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
751 # `````:;'++##@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@+.```` ``+@@@@``
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
752 # ```````````````````````````+##@``````````````````@#@``````````````````````````````` ``+@@@@``
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
753 # `````````````````````````@##@``````````````````@##;```````````````````````````` ``+@@@@``
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
754 # ````###,```` ````+##@``` ``+@@@@``
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
755 # ``,###``` ``.@##``` ``'@@@@``
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
756 # ``###@`` ```@##``` ``'@@@@``
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
757 # ```@##@`` ``@##+`` ``'@@@@``
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
758 # ```###.`` ``:##@`` ``'@@@@``
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
759 # ``:###``` ```##@``` ``'@@@@``
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
760 # ``@##@`` ```@##``` ``'@@@@``
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
761 # ```@##'`` ``@###`` ``'@@@@``
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
762 # ```@##``` ```##@`` ``'@@@@``
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
763 # ``,###``` ```@#@``` ``'@@@@``
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
764 # ``####`` ``@##.`` ``'@@@@``
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
765 # ``@##@`` ``;##@`` ``'@@@@``
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
766 # `````````@##@`` ```##@```` ``;@@@@``
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
767 # ``````````````@##;`` ```###`````````````` ``;@@@@``
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
768 # `````````.,;.```###``` ``@##:`````````````` ``;@@@@``
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
769 # `````#@#########@@##``` ``###@@@@@@###@#@'``` ``;@@@@``
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
770 # ```@@###############@`` ``,################`` ``;@@@@``
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
771 # ``'@################+`` ```###############+`` ``;@@@@``
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
772 # `````````````````````` ``###########@#,```` ``.@@@@``
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
773 # ````````````````````` ``````````````````` ```@@@.`
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
774 # ```````````````` ```````
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
775 #
ad553834b0ea Uploaded
kaymccoy
parents:
diff changeset
776 #