annotate calc_fitness.py @ 11:1bc740b6462d draft default tip

Uploaded
author kaymccoy
date Sun, 06 Nov 2016 20:31:32 -0500
parents 369ad02454d8
children
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
10
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
1 # A translation of calc_fitness.pl into python! For analysis of Tn-Seq.
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
2 # This script requires BioPython, which in turn has a good number of dependencies (some optional but very helpful).
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
3 # How to install BioPython and a list of its dependencies can be found here: http://biopython.org/DIST/docs/install/Installation.html
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
4 # K. McCoy
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
5
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
6
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
7
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
8
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
9
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
10
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
11
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
12
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
13
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
14 ##### ARGUMENTS #####
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
15
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
16 def print_usage():
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
17 print "\n" + "You are missing one or more required flags. A complete list of flags accepted by calc_fitness is as follows:" + "\n\n"
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
18 print "\033[1m" + "Required" + "\033[0m" + "\n"
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
19 print "-ref" + "\t\t" + "The name of the reference genome file, in GenBank format." + "\n"
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
20 print "-t1" + "\t\t" + "The name of the bowtie mapfile from time 1." + "\n"
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
21 print "-t2" + "\t\t" + "The name of the bowtie mapfile from time 2." + "\n"
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
22 print "-out" + "\t\t" + "Name of a file to enter the .csv output." + "\n"
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
23 print "\n"
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
24 print "\033[1m" + "Optional" + "\033[0m" + "\n"
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
25 print "-expansion" + "\t\t" + "Expansion factor (default: 250)" + "\n"
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
26 print "-reads1" + "\t\t" + "The number of reads to be used to calculate the correction factor for time 0." + "\n\t\t" + "(default counted from bowtie output)" + "\n"
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
27 print "-reads2" + "\t\t" + "The number of reads to be used to calculate the correction factor for time 6." + "\n\t\t" + "(default counted from bowtie output)" + "\n"
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
28 print "-cutoff" + "\t\t" + "Discard any positions where the average of counted transcripts at time 0 and time 1 is below this number (default 0)" + "\n"
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
29 print "-cutoff2" + "\t\t" + "Discard any positions within the normalization genes where the average of counted transcripts at time 0 and time 1 is below this number (default 10)" + "\n"
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
30 print "-strand" + "\t\t" + "Use only the specified strand (+ or -) when counting transcripts (default: both)" + "\n"
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
31 print "-normalize" + "\t" + "A file that contains a list of genes that should have a fitness of 1 - used for normalization and bottleneck calculations." + "\n"
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
32 print "-b" + "\t" + "Calculate bottleneck value from all genes (rather than only normalization genes)" + "\n"
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
33 print "-maxweight" + "\t" + "The maximum weight a transposon gene can have in normalization calculations" + "\n"
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
34 print "-multiply" + "\t" + "Multiply all fitness scores by a certain value (e.g., the fitness of a knockout). You should normalize the data." + "\n"
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
35 print "-ef" + "\t\t" + "Exclude insertions that occur in the first N amount (%) of gene--becuase may not affect gene function." + "\n"
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
36 print "-el" + "\t\t" + "Exclude insertions in the last N amount (%) of the gene--considering truncation may not affect gene function." + "\n"
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
37 print "-wig" + "\t\t" + "Create a wiggle file for viewing in a genome browser. Provide a filename." + "\n"
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
38 print "-uncol" + "\t\t" + "Use if reads were uncollapsed when mapped." + "\n"
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
39 print "\n"
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
40
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
41 import argparse
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
42 parser = argparse.ArgumentParser()
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
43 parser.add_argument("-ref", action="store", dest="ref_genome")
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
44 parser.add_argument("-t1", action="store", dest="mapfile1")
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
45 parser.add_argument("-t2", action="store", dest="mapfile2")
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
46 parser.add_argument("-out", action="store", dest="outfile")
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
47 parser.add_argument("-out2", action="store", dest="outfile2")
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
48 parser.add_argument("-expansion", action="store", dest="expansion_factor")
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
49 parser.add_argument("-reads1", action="store", dest="reads1")
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
50 parser.add_argument("-reads2", action="store", dest="reads2")
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
51 parser.add_argument("-cutoff", action="store", dest="cutoff")
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
52 parser.add_argument("-cutoff2", action="store", dest="cutoff2")
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
53 parser.add_argument("-strand", action="store", dest="usestrand")
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
54 parser.add_argument("-normalize", action="store", dest="normalize")
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
55 parser.add_argument("-b", action="store", dest="bottleall")
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
56 parser.add_argument("-maxweight", action="store", dest="max_weight")
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
57 parser.add_argument("-multiply", action="store", dest="multiply")
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
58 parser.add_argument("-ef", action="store", dest="exclude_first")
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
59 parser.add_argument("-el", action="store", dest="exclude_last")
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
60 parser.add_argument("-wig", action="store", dest="wig")
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
61 parser.add_argument("-uncol", action="store", dest="uncol")
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
62 arguments = parser.parse_args()
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
63
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
64 if (not arguments.ref_genome or not arguments.mapfile1 or not arguments.mapfile2 or not arguments.outfile):
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
65 print_usage()
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
66 quit()
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
67
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
68 # Sets the default value of the expansion factor to 250, which is a trivial placeholder number.
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
69
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
70 if (not arguments.expansion_factor):
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
71 arguments.expansion_factor = 250
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
72
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
73 # 75 is similarly trivial
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
74
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
75 if (not arguments.max_weight):
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
76 arguments.max_weight = 75
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
77
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
78 # Sets the default value of cutoff to 0; cutoff exists to discard positions with a low number of counted transcripts, because fitnesses calculated from them may not be very accurate, by the same reasoning that studies with low sample sizes are innacurate.
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
79
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
80 if (not arguments.cutoff):
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
81 arguments.cutoff = 0
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
82
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
83 # Sets the default value of cutoff2 to 10; cutoff2 exists to discard positions within normalization genes with a low number of counted transcripts, because fitnesses calculated from them similarly may not be very accurate.
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
84 # This only has an effect if it's larger than cutoff, since the normalization step references a list of insertions already affected by cutoff.
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
85
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
86 if (not arguments.cutoff2):
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
87 arguments.cutoff2 = 10
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
88
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
89 if (not arguments.usestrand):
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
90 arguments.usestrand = "both"
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
91
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
92
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
93
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
94
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
95
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
96
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
97 ##### PARSING THE REFERENCE GENOME #####
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
98
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
99 def get_time():
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
100 import datetime
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
101 return datetime.datetime.now().time()
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
102 print "\n" + "Starting: " + str(get_time()) + "\n"
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
103
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
104 from Bio import SeqIO
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
105 import os.path
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
106 handle = open(arguments.ref_genome, "rU")
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
107 for record in SeqIO.parse(handle, "genbank"):
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
108 refname = record.id
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
109 features = record.features
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
110 handle.close()
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
111
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
112 # Makes a dictionary out of each feature that's a gene - with its gene name, start location, end location, and strand as keys to their values. Then makes a list out of all those dictionaries for ease of accessing later on.
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
113
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
114 feature_list = []
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
115 for feature in features:
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
116 if feature.type == "gene":
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
117 gene = feature.qualifiers["locus_tag"]
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
118 strand = feature.location.strand
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
119 start = float(feature.location.start)
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
120 end = float(feature.location.end)
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
121
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
122 # Exclude_first and exclude_last are used here to exclude whatever percentage of the genes you like from calculations; e.g. a value of 0.1 for exclude_last would exclude the last 10% of all genes!
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
123 # This can be useful because insertions at the very start or end of genes often don't actually break its function.
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
124
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
125 if (arguments.exclude_first):
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
126 start += (end - start) * float(arguments.exclude_first)
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
127 if (arguments.exclude_last):
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
128 end -= (end - start) * float(arguments.exclude_last)
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
129 feature_dictionary = {"gene": gene, "start": start, "end": end, "strand": strand}
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
130 feature_list.append(feature_dictionary)
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
131
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
132 print "Done generating feature lookup: " + str(get_time()) + "\n"
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
133
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
134
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
135
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
136
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
137
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
138
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
139
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
140
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
141
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
142
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
143 ##### PARSING THE MAPFILES #####
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
144
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
145 with open(arguments.mapfile1) as file:
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
146 r1 = file.readlines()
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
147 with open(arguments.mapfile2) as file:
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
148 r2 = file.readlines()
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
149
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
150 # When called, goes through each line of the mapfile to find the strand (+/Watson or -/Crick), count, and position of the read. It may be helpful to look at how the mapfiles are formatted to understand how this code finds them.
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
151
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
152 def read_mapfile(reads):
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
153 plus_total = 0
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
154 minus_total = 0
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
155 plus_counts = {"total": 0, "sites": 0}
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
156 minus_counts = {"total": 0, "sites": 0}
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
157 for read in reads:
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
158 if (arguments.uncol):
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
159 strand = read.split()[2]
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
160 count = 1
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
161 position = float(read.split()[4])
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
162 if arguments.usestrand != "both" and strand != arguments.usestrand:
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
163 continue
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
164 if (strand == "+"):
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
165 sequence_length = len(read.split()[5])
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
166 position += (sequence_length - 2)
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
167 plus_counts["total"] += count
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
168 plus_counts["sites"] += 1
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
169 if position in plus_counts:
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
170 plus_counts[position] += count
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
171 else:
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
172 plus_counts[position] = count
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
173 else:
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
174 minus_counts["total"] += count
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
175 minus_counts["sites"] += 1
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
176 if position in minus_counts:
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
177 minus_counts[position] += count
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
178 else:
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
179 minus_counts[position] = count
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
180 else:
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
181 if "-" in read.split()[0]:
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
182 strand = read.split()[1]
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
183 count = float(read.split()[0].split("-")[1])
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
184 position = float(read.split()[3])
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
185 else:
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
186 continue
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
187
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
188 # If for some reason you want to skip all reads from one of the strands - for example, if you wanted to compare the two strands - that's done here.
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
189
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
190 if arguments.usestrand != "both" and strand != arguments.usestrand:
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
191 continue
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
192
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
193 # Makes dictionaries for the + & - strands, with each insert position as a key and the number of insertions there as its corresponding value.
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
194
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
195 if (strand == "+"):
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
196 sequence_length = len(read.split()[4])
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
197
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
198 # The -2 in "(sequence_length -2)" comes from a fake "TA" in the read; see how the libraries are constructed for further on this
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
199
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
200 position += (sequence_length - 2)
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
201 plus_counts["total"] += count
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
202 plus_counts["sites"] += 1
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
203 if position in plus_counts:
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
204 plus_counts[position] += count
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
205 else:
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
206 plus_counts[position] = count
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
207 else:
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
208 minus_counts["total"] += count
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
209 minus_counts["sites"] += 1
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
210 if position in minus_counts:
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
211 minus_counts[position] += count
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
212 else:
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
213 minus_counts[position] = count
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
214 return (plus_counts, minus_counts)
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
215
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
216 # Calls read_mapfile(reads) to parse arguments.reads1 and arguments.reads2 (your reads from t1 and t2).
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
217
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
218
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
219
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
220
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
221
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
222 (plus_ref_1, minus_ref_1) = read_mapfile(r1)
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
223 print "Read first file: " + str(get_time()) + "\n"
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
224 (plus_ref_2, minus_ref_2) = read_mapfile(r2)
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
225 print "Read second file: " + str(get_time()) + "\n"
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
226
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
227 # The lines below are just printed for reference. The number of sites is the length of a given dictionary of sites - 1 because its last key, "total", isn't actually a site.
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
228
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
229 print "Reads:" + "\n"
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
230 print "1: + " + str(plus_ref_1["total"]) + " - " + str(minus_ref_1["total"]) + "\n"
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
231 print "2: + " + str(plus_ref_2["total"]) + " - " + str(minus_ref_2["total"]) + "\n"
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
232 print "Sites:" + "\n"
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
233 print "1: + " + str(plus_ref_1["sites"]) + " - " + str(minus_ref_1["sites"]) + "\n"
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
234 print "2: + " + str(plus_ref_2["sites"]) + " - " + str(minus_ref_2["sites"]) + "\n"
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
235
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
236
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
237
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
238
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
239
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
240
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
241
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
242
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
243
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
244
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
245 ##### FITNESS CALCULATIONS #####
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
246
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
247 # If reads1 and reads2 weren't specified in the command line, sets them as the total number of reads (found in read_mapfile())
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
248
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
249 if not arguments.reads1:
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
250 arguments.reads1 = plus_ref_1["total"] + minus_ref_1["total"]
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
251 if not arguments.reads2:
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
252 arguments.reads2 = plus_ref_2["total"] + minus_ref_2["total"]
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
253
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
254 # Calculates the correction factors for reads from t1 and t2; cfactor1 and cfactor2 are the number of reads from t1 and t2 respectively divided by total, which is the average number of reads between the two.
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
255 # This is used later on to correct for pipetting errors, or any other error that would cause unequal amounts of DNA from t1 and t2 to be sequenced so that an unequal amount of reads is produced
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
256
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
257 total = (float(arguments.reads1) + float(arguments.reads2))/2
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
258 cfactor1 = float(arguments.reads1)/total
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
259 cfactor2 = float(arguments.reads2)/total
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
260 print "Cfactor 1: " + str(cfactor1) + "\n"
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
261 print "Cfactor 2: " + str(cfactor2) + "\n"
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
262 import math
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
263 import csv
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
264 results = [["position", "strand", "count_1", "count_2", "ratio", "mt_freq_t1", "mt_freq_t2", "pop_freq_t1", "pop_freq_t2", "gene", "D", "W", "nW"]]
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
265 genic = 0
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
266 total_inserts = 0
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
267 with open(arguments.ref_genome, "r") as file:
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
268 firstline = file.readline()
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
269 genomelength = firstline.split()[2]
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
270 i = 0
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
271 while i < float(genomelength):
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
272
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
273 # At each possible location for an insertion in the genome, counts the number of actual insertions at t1 and which strand(s) the corresponding reads came from.
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
274
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
275 c1 = 0
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
276 if i in plus_ref_1:
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
277 c1 = float(plus_ref_1[i])
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
278 strand = "+/"
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
279 if i in minus_ref_1:
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
280 c1 += float(minus_ref_1[i])
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
281 strand = "b/"
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
282 elif i in minus_ref_1:
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
283 c1 = float(minus_ref_1[i])
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
284 strand = "-/"
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
285
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
286 # If there were no insertions at a certain location at t1 just continues to the next location; there can't be any comparison to make between t1 and t2 if there are no t1 insertions!
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
287
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
288 else:
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
289 i += 1
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
290 continue
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
291
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
292 # At each location where there was an insertion at t1, counts the number of insertions at t2 and which strand(s) the corresponding reads came from.
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
293
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
294 c2 = 0
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
295 if i in plus_ref_2:
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
296 c2 = float(plus_ref_2[i])
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
297 if i in minus_ref_2:
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
298 c2 += float(minus_ref_2[i])
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
299 strand += "b"
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
300 else:
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
301 strand += "+"
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
302 elif i in minus_ref_2:
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
303 c2 = float(minus_ref_2[i])
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
304 strand += "-"
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
305
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
306 # Corrects with cfactor1 and cfactor2
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
307
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
308 c1 /= cfactor1
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
309 if c2 != 0:
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
310 c2 /= cfactor2
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
311 ratio = c2/c1
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
312 else:
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
313 c2 = 0
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
314 ratio = 0
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
315
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
316 # Passes by all insertions with a number of reads smaller than the cutoff, as they may lead to inaccurate fitness calculations.
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
317
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
318 if (c1 + c2)/2 < float(arguments.cutoff):
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
319 i+= 1
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
320 continue
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
321
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
322 # Calculates each insertion's frequency within the populations at t1 and t2.
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
323
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
324 mt_freq_t1 = c1/total
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
325 mt_freq_t2 = c2/total
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
326 pop_freq_t1 = 1 - mt_freq_t1
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
327 pop_freq_t2 = 1 - mt_freq_t2
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
328
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
329 # Calculates each insertion's fitness! This is from the fitness equation log((frequency of mutation @ time 2 / frequency of mutation @ time 1)*expansion factor)/log((frequency of population without the mutation @ time 2 / frequency of population without the mutation @ time 1)*expansion factor)
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
330
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
331 w = 0
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
332 if mt_freq_t2 != 0:
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
333 top_w = math.log(mt_freq_t2*(float(arguments.expansion_factor)/mt_freq_t1))
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
334 bot_w = math.log(pop_freq_t2*(float(arguments.expansion_factor)/pop_freq_t1))
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
335 w = top_w/bot_w
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
336
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
337 # Checks which gene locus the insertion falls within, and records that.
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
338
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
339 gene = ''
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
340 for feature_dictionary in feature_list:
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
341 if feature_dictionary["start"] <= i and feature_dictionary["end"] >= i:
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
342 gene = "".join(feature_dictionary["gene"])
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
343 genic += 1
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
344 break
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
345 total_inserts += 1
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
346
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
347 # Writes all relevant information on each insertion and its fitness to a cvs file: the location of the insertion, its strand, c1, c2, etc. (the variable names are self-explanatiory)
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
348 # w is written twice, because the second w will be normalized if normalization is called for, thus becoming nW.
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
349
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
350 row = [i, strand, c1, c2, ratio, mt_freq_t1, mt_freq_t2, pop_freq_t1, pop_freq_t2, gene, arguments.expansion_factor, w, w]
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
351 results.append(row)
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
352 i += 1
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
353 with open(arguments.outfile, "wb") as csvfile:
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
354 writer = csv.writer(csvfile)
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
355 writer.writerows(results)
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
356
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
357 print "Done comparing mapfiles " + str(get_time()) + "\n"
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
358 print "Genic: " + str(genic) + "\n"
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
359 print "Total: " + str(total_inserts) + "\n"
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
360
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
361
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
362
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
363
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
364
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
365
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
366
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
367
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
368
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
369
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
370 ##### BOTTLENECK VALUE CALCULATION #####
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
371
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
372 #the bottleneck value is calculated here if done from all genes - otherwise it's done in the normalization section if only taken from normalization genes
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
373
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
374 if (arguments.bottleall):
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
375 for list in results:
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
376 if list[11] == 0:
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
377 overall_blank_count += 1
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
378 overall_original_count = len(results)
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
379
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
380 pc_blank_normals = float(overall_blank_count) / float(overall_original_count)
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
381
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
382 with open(arguments.outfile2, "w") as f:
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
383 f.write("bottleneck_value: " + str(pc_blank_normals) + "\n" + "total: " + str(total) + "\n" + "refname: " + refname)
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
384
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
385
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
386
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
387
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
388
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
389
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
390
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
391
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
392
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
393
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
394 ##### NORMALIZATION #####
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
395
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
396 # If making a WIG file is requested in the arguments, starts a string to be added to and then written to the WIG file with a typical WIG file header.
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
397 # The header is just in a typical WIG file format; if you'd like to look into this more UCSC has notes on formatting WIG files on their site.
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
398
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
399 if (arguments.wig):
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
400 wigstring = "track type=wiggle_0 name=" + arguments.wig + "\n" + "variableStep chrom=" + refname + "\n"
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
401
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
402 # Takes normalization genes (which should all be predicted or known to have fitness values of exactly 1.0, like transposons for example) and uses them to normalize the fitnesses of all insertion locations
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
403
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
404 if (arguments.normalize):
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
405 with open(arguments.normalize) as file:
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
406 transposon_genes = file.read().splitlines()
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
407 print "Normalize genes loaded" + "\n"
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
408 blank_ws = 0
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
409 sum = 0
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
410 count = 0
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
411 weights = []
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
412 scores = []
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
413 for list in results:
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
414 if list[9] != '' and list[9] in transposon_genes:
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
415 c1 = list[2]
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
416 c2 = list[3]
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
417 score = list[11]
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
418 avg = (c1 + c2)/2
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
419
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
420 # Skips over those insertion locations with too few insertions - their fitness values are less accurate because they're based on such small insertion numbers.
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
421
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
422 if float(c1) >= float(arguments.cutoff2):
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
423
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
424 # Sets a max weight, to prevent insertion location scores with huge weights from unbalancing the normalization.
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
425
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
426 if (avg >= float(arguments.max_weight)):
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
427 avg = float(arguments.max_weight)
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
428
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
429 # Tallies how many w values are 0 within the blank_ws value; you might get many transposon genes with a w value of 0 if a bottleneck occurs, for example, which is especially common with in vivo experiments. This is used later by aggregate.py
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
430 # For example, when studying a nasal infection in a mouse model, what bacteria "sticks" and is able to survive and what bacteria is swallowed and killed or otherwise flushed out tends to be a matter of chance not fitness; all mutants with an insertion in a specific transposon gene could be flushed out by chance!
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
431
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
432 if score == 0:
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
433 blank_ws += 1
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
434
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
435 sum += score
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
436 count += 1
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
437 weights.append(avg)
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
438 scores.append(score)
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
439
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
440 print str(list[9]) + " " + str(score) + " " + str(c1)
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
441
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
442 # Counts and removes all "blank" fitness values of normalization genes - those that = 0 - because they most likely don't really have a fitness value of 0, and you just happened to not get any reads from that location at t2.
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
443
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
444 blank_count = 0
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
445 original_count = len(scores)
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
446 curr_count = original_count
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
447 i = 0
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
448 while i < curr_count:
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
449 w_value = scores[i]
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
450 if w_value == 0:
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
451 blank_count += 1
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
452 weights.pop(i)
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
453 scores.pop(i)
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
454 i -= 1
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
455 curr_count = len(scores)
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
456 i += 1
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
457
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
458 # If no normalization genes can pass the cutoff, normalization cannot occur, so this ends the script advises the user to try again and lower cutoff and/or cutoff2.
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
459
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
460 if len(scores) == 0:
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
461 print 'ERROR: The normalization genes do not have enough reads to pass cutoff and/or cutoff2; please lower one or both of those arguments.' + "\n"
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
462 quit()
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
463
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
464 pc_blank_normals = float(blank_countv) / float(original_count)
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
465 print "# blank out of " + str(original_count) + ": " + str(pc_blank_normals) + "\n"
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
466 if (!arguments.bottleall):
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
467 with open(arguments.outfile2, "w") as f:
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
468 f.write("bottleneck_value: " + str(pc_blank_normals) + "\n" + "total: " + str(total) + "\n" + "refname: " + refname)
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
469
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
470 average = sum / count
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
471 i = 0
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
472 weighted_sum = 0
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
473 weight_sum = 0
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
474 while i < len(weights):
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
475 weighted_sum += weights[i]*scores[i]
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
476 weight_sum += weights[i]
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
477 i += 1
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
478 weighted_average = weighted_sum/weight_sum
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
479
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
480 print "Normalization step:" + "\n"
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
481 print "Regular average: " + str(average) + "\n"
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
482 print "Weighted Average: " + str(weighted_average) + "\n"
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
483 print "Total Insertions: " + str(count) + "\n"
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
484
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
485 old_ws = 0
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
486 new_ws = 0
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
487 wcount = 0
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
488
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
489 for list in results:
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
490 if list[11] == 'W':
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
491 continue
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
492 new_w = float(list[11])/weighted_average
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
493
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
494 # Sometimes you want to multiply all the fitness values by a constant; this does that.
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
495 # For example you might multiply all the values by a constant for a genetic interaction screen - where Tn-Seq is performed as usual except there's one background knockout all the mutants share.
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
496
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
497 if arguments.multiply:
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
498 new_w *= float(arguments.multiply)
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
499
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
500 if float(list[11]) > 0:
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
501 old_ws += float(list[11])
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
502 new_ws += new_w
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
503 wcount += 1
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
504
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
505 list[12] = new_w
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
506
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
507 if (arguments.wig):
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
508 wigstring += str(list[0]) + " " + str(new_w) + "\n"
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
509
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
510 old_w_mean = old_ws / wcount
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
511 new_w_mean = new_ws / wcount
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
512 print "Old W Average: " + str(old_w_mean) + "\n"
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
513 print "New W Average: " + str(new_w_mean) + "\n"
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
514
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
515 with open(arguments.outfile, "wb") as csvfile:
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
516 writer = csv.writer(csvfile)
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
517 writer.writerows(results)
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
518
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
519 if (arguments.wig):
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
520 if (arguments.normalize):
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
521 with open(arguments.wig, "wb") as wigfile:
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
522 wigfile.write(wigstring)
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
523 else:
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
524 for list in results:
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
525 wigstring += str(list[0]) + " " + str(list[11]) + "\n"
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
526 with open(arguments.wig, "wb") as wigfile:
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
527 wigfile.write(wigstring)
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
528
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
529
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
530
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
531
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
532
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
533
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
534
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
535
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
536
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
537
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
538
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
539
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
540
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
541
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
542
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
543
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
544
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
545
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
546
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
547
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
548
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
549
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
550
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
551
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
552
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
553
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
554
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
555
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
556
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
557
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
558
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
559
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
560
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
561
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
562
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
563
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
564
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
565
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
566
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
567
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
568
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
569
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
570
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
571
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
572
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
573
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
574
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
575
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
576
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
577
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
578
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
579
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
580
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
581
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
582
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
583
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
584
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
585
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
586
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
587
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
588
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
589
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
590
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
591
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
592
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
593
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
594
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
595
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
596
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
597
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
598
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
599
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
600
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
601
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
602
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
603
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
604
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
605
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
606
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
607
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
608
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
609
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
610
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
611
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
612
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
613
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
614
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
615
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
616
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
617
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
618
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
619
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
620
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
621
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
622
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
623
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
624
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
625
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
626
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
627
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
628
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
629 # `````````````
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
630 # `````````````
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
631 # ``@@@@@@@@@``
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
632 # ``@@@@@@@@@```
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
633 # ``@@@@@@@@@``
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
634 # ``@@@@@@@@@``
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
635 # ``@@@@@@@@@``
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
636 # ``@@@@@@@@@``
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
637 # ```@@@@@@@@#``
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
638 # ```@@@@@@@@#``
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
639 # ```@@@@@@@@+``
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
640 # ```@@@@@@@@'``
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
641 # ```@@@@@@@@;``
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
642 # ```@@@@@@@@;``
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
643 # ```@@@@@@@@:``
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
644 # ```@@@@@@@@,``
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
645 # ``.@@@@@@@@.``
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
646 # ``.@@@@@@@@```
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
647 # ``.@@@@@@@@```
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
648 # ``.@@@@@@@@```
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
649 # ``.@@@@@@@@``
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
650 # ``,@@@@@@@@``
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
651 # ``,@@@@@@@@``
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
652 # ``.@@@@@@@@``
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
653 # ```@@@@@@@@``
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
654 # ``:@@@@@@@@``
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
655 # ``:@@@@@@@@``
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
656 # ``:@@@@@@@@``
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
657 # ``:@@@@@@@@``
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
658 # ``'@@@@@@@@``
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
659 # ``;@@@@@@@@``
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
660 # ``:@@@@@@@@``
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
661 # ``:@@@@@@@@``
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
662 # ``:@@@@@@@@``
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
663 # ``;@@@@@@@#``
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
664 # ````+@@@@@@@#`````
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
665 # ```````#@@@@@@@#``````
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
666 # `````.,@@@@@@@@@...````
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
667 # ``@@@@@@@@@@@@@@@@@@;``
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
668 # ``@@@@@@@@@@@@@@@@@@;``
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
669 # ```````````````````````
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
670 # `````````````````````
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
671 # ``````.```````
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
672 # ````@.''```
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
673 # ```# `;```
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
674 # ``.+ @```
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
675 # ```@ ````,+```
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
676 # ```;;````` @```
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
677 # ```@ ``````,@```
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
678 # ```,+```..```@```
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
679 # ```@ ``....```@```
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
680 # ```+' ``....```#'``
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
681 # ```@```......`` @```
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
682 # ```'+```......```'@```
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
683 # ```@ ``........```@```
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
684 # ```'#```........````@```
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
685 # ```@ ``..........```#,``
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
686 # ```'#```...........`` @```
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
687 # ```@``.............```.+```
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
688 # ```:#```.............`` #```
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
689 # ``````` ```@ ```.......#......``.@```
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
690 # `````````` ```:@```#`......@......```@```
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
691 # ``````#@@@`` ```@ `.`:.......@.......`` @```
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
692 # ```.#@###@`` ```:@``..`+`....`@.......```@,``
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
693 # ```'@####@``` ```@````..@@@@@@@@#,`..#```` @```
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
694 # ```#####@@``` ``;@ ,`.,@@. `@@..#..```''``
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
695 # ``:####@#```` ```@``@`@@ @@:...`` @```
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
696 # ```@#####```` ``,@``.@, ,@`...``:@```
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
697 # ``.####@``` ```@.` @` @....``@```
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
698 # ``####@``` ``,@ @.` @`.````@```
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
699 # ``@##@```` ```@, @: ;# `@..```@.``
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
700 # ```@##```` ``.@`,@ @@, #...`` @```
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
701 # ```@#@``` ```@, # `@@@ @`.```;'``
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
702 # ```##:`` ``.@ +, .@@@ ,'..`` @```
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
703 # ``.##``` ```@, @ `@@@ @`.```,+```
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
704 # `````@##``` ```@`'. @@@ :...```@``` ``````````
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
705 # ````````````````````````````````````````##@``` ```@:`@ @@@ #...`` #``` `````````````````
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
706 # ```````````````````````````````````````.###@``` ```@ `, .@@@++'++#@@'` #`..```#``` ````````````'@@@@@.````
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
707 # `````+@####################@@@@@@@@@@@@#####@``` ```#;`,. `@#...,.,,,,,,..;@, @....`` @``````````````+@@@########@.``
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
708 # `+@##########################################,```` ```````````````@```@ +@,.,,,,,,,,,,,,,,,,,@ @....```#`````````'@@@##############@```
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
709 # `@###########################################@``````````````````````````````````````+'``.,'.#.,,,,,,,,,,,,,,,,,,,,.++@......`` @````+@@@#######@+``````'###'``
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
710 # ``:@@########@@@@@@@@@@@@@@@@@@@@@@#@@@@@@@##@``````````````````````````......,`,,.,@ ```.##.,.,,,,,,,,,,,,,,,,,,,,.##......`` :.+@@#######@@:``````````###@```
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
711 # ````````````````````````````````,#########@###@@@@#################################@'```...@.,,,,,,,,,,,,,,,,,,,,,,,#.........`'@######@@+```````````````@##```
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
712 # ```````````````````````````````@#########@#########################################```.....@:,,,,,,,,,,,,,,,,,,..;@..........`@####@@:```````` ```@##@``
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
713 # `````@@####@@@##########@@@@@@@@@@@@@@@@@@@@@@@@@@@@#+@+```......@#.,,,,,,,,,,,,,,,,.##..........`` #@#````````` ```##@```
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
714 # ``.#@######@####:```````````````````````````````````@ ``.......@:#,,,,,,,,,,,,,,,;@@`............`` @`````` ```@##:``
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
715 # ``:########@###@```````````````````````````````````#;```......+..`##,.,,,,,,,,.#@#..'............`` @```` ``;##@```
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
716 # ```@@####@@##@'```` ````@ ``.......'.....@@#+;:;'#@@;`...#`............`` @``` ```@##```
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
717 # ```````````````` ```@,```.............'..:''':.@`......:............```@.`` ``@###```
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
718 # `````````````` ``.@```..............#........'`....................```@``` ``.##@``````
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
719 # ```@.``..............`#........,.....................```@.`` ```@#+,``````
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
720 # ``.@``.,,,,,,,,,,,,,,,,,,,,,,,,,,,,,,.................```@``` ````+#####@````
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
721 # ```@````......,........................,....,,.,.,,,,,..` @,`` ```;@@######````
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
722 # ``.@```.......,......................`......,...........```@``` ```+#########@````
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
723 # ```@```...........`@@+...............+@@`....,...........```@:`` ``;@#########@'```
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
724 # ``.@ ``............@@@@@`.........,@@@@@.....,............```@``` ``@#########@#@@```
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
725 # ```@.```............@@@@@@@`.....'@@@@@@@.....,............```#'`` ``@###@###@#@#@@@``
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
726 # ``.@```.............@@@@@@@@@..+#@@@@@@@@.....,.............`` #``` ``@#@@@@##@#@#@@@``
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
727 # ```@````.............@@@@@@@@@@@@@@@@@@@@@.....,.............```'#``` ``'#@@@@##@#@@@@@,`
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
728 # ``.@ ``.........,....@@@@@@@@@',##@@@@@@@@`....,..............```@``` ```@@@@@##@@'#@@@@`
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
729 # ```@.```.........,....@@@@@@@#`...`#@@@@@@@`....,..............```.@``` ``#@@@@##;```@@@@`
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
730 # ``.@ ``.....,,,,,,,.,.@@@@@#.,,,,,,,.#@@@@@,,,,,,,,,,,,:,,,,,,,,.``@``` ``#@@@@#.````@@@@`
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
731 # ```@. ``...............@@@;......,......#@@@`...........,.........```@``` ``#@@@;``````@@@@`
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
732 # ```@```................@,........,........+#`...........,.........```@.`` ``#@@@;``````@@@@`
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
733 # ```@.``...........................,.........`............,..........```@``` ``#@@@'`` ``#@@;`
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
734 # ``.@ ``................,..........,......................,..........```#:`` ``#@@@'`` ```#@``
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
735 # ```@,``............................,......................,...........`` @``` ``+@@@'`` `````
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
736 # ``.@```............................,......................,...........```#+`` ``;@@@+`` ``
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
737 # ```@,``.............................,......................,............```@``` ``'@@@+``
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
738 # ``.@```.........,...................,......................,............```'#``` ``;@@@+``
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
739 # ```@:```.........,...................,......................,.............`` @``` ``:@@@+``
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
740 # ```@`..,,,,,,,,,,,,,,,,,,..,.........,......................,.............```'@``` ``;@@@#``
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
741 # ``+'```...,.................,....,,,,,,,,,,,,,,,,,,,,,,,,,,,,,..........,...``@``` ``;@@@#``
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
742 # ```@ ``....,.................,.......................................,.......``;@``` ``:@@@#``
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
743 # ``'#```....,.................,.......................................,.......```@``` ``:@@@@``
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
744 # ```@```.....,.................,.......................................,........``;#`` ``:@@@@``
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
745 # ```@ ``.....,.................,.......................................,........`` @``` ``:@@@@``
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
746 # ``@````...............................................................,........`` @.`` ``;@@@@``
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
747 # ``@ ```..............................................................,........`` .#`` ``'@@@@``
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
748 # ``# ``````.`.```````````````..````````````````````..`````````````````.`````````` @`` ``'@@@@``
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
749 # ``. `````````````````````````````````````````````````````````````````````````` .;`` ``'@@@@``
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
750 # ``@;` `` ` ` ` ` ```` ` ````` ` ` `,+@``` ``+@@@@``
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
751 # `````:;'++##@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@@+.```` ``+@@@@``
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
752 # ```````````````````````````+##@``````````````````@#@``````````````````````````````` ``+@@@@``
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
753 # `````````````````````````@##@``````````````````@##;```````````````````````````` ``+@@@@``
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
754 # ````###,```` ````+##@``` ``+@@@@``
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
755 # ``,###``` ``.@##``` ``'@@@@``
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
756 # ``###@`` ```@##``` ``'@@@@``
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
757 # ```@##@`` ``@##+`` ``'@@@@``
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
758 # ```###.`` ``:##@`` ``'@@@@``
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
759 # ``:###``` ```##@``` ``'@@@@``
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
760 # ``@##@`` ```@##``` ``'@@@@``
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
761 # ```@##'`` ``@###`` ``'@@@@``
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
762 # ```@##``` ```##@`` ``'@@@@``
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
763 # ``,###``` ```@#@``` ``'@@@@``
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
764 # ``####`` ``@##.`` ``'@@@@``
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
765 # ``@##@`` ``;##@`` ``'@@@@``
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
766 # `````````@##@`` ```##@```` ``;@@@@``
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
767 # ``````````````@##;`` ```###`````````````` ``;@@@@``
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
768 # `````````.,;.```###``` ``@##:`````````````` ``;@@@@``
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
769 # `````#@#########@@##``` ``###@@@@@@###@#@'``` ``;@@@@``
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
770 # ```@@###############@`` ``,################`` ``;@@@@``
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
771 # ``'@################+`` ```###############+`` ``;@@@@``
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
772 # `````````````````````` ``###########@#,```` ``.@@@@``
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
773 # ````````````````````` ``````````````````` ```@@@.`
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
774 # ```````````````` ```````
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
775 #
369ad02454d8 Uploaded
kaymccoy
parents:
diff changeset
776 #