# HG changeset patch # User nitrozyna # Date 1516133720 18000 # Node ID d3dbf9e8a0e214954356a75ac742a07a5b8dcec1 # Parent a1cb5223ac3697d8a77c4b6c5d87db36977701da Uploaded diff -r a1cb5223ac36 -r d3dbf9e8a0e2 generate_data.py --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/generate_data.py Tue Jan 16 15:15:20 2018 -0500 @@ -0,0 +1,24 @@ +from __future__ import print_function +import math +import random +# that's our x data, i.e. reference +x = range(1, 101) + +# generate a gaussian +def gaussian(x, amp, cen, wid): + return amp * math.exp(-(x - cen) ** 2 / wid) + +read1 = 18 +read2 = 66 + +# that's our y data, i.e. reads +y = [int(round(gaussian(i, 20000, read1, 0.5) + gaussian(i, 20000, read2, 0.5) + random.gauss(200, 90))) for i in x] + +# that's our data printed in pairs (x_i, y_i) +with open("input.txt", "w") as f: + for pair in zip(x, y): + for p in pair: + print(p, end="\t", file=f) + print(file=f) + +# you have to set this manually to weed out all the noise. Every bit of noise should be below it.