Mercurial > repos > mheinzl > fsd
annotate fsd.py @ 1:770a38352a51 draft
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit 2847d08dae94bb2307768c99badcf49ec302fc74-dirty
author | mheinzl |
---|---|
date | Thu, 03 May 2018 13:33:14 -0400 |
parents | 9736b9d04a0b |
children | 648d5df50ca8 |
rev | line source |
---|---|
0
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
1 #!/usr/bin/env python |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
2 |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
3 # Family size distribution of SSCSs |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
4 # |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
5 # Author: Monika Heinzl, Johannes-Kepler University Linz (Austria) |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
6 # Contact: monika.heinzl@edumail.at |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
7 # |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
8 # Takes at least one TABULAR file with tags before the alignment to the SSCS, but up to 4 files can be provided, as input. |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
9 # The program produces a plot which shows the distribution of family sizes of all the SSCSs from the input files and |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
10 # a CSV file with the data of the plot, as well as a TXT file with all tags of the DCS and their family sizes. |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
11 # If only one file is provided, a family size distribution split into SSCSs without a partner and DCSs is produced. |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
12 # Whereas a family size distribution with multiple data in one plot is produced, when more than one file (up to 4) is given. |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
13 |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
14 # USAGE: python FSD_Galaxy_1.4_commandLine_FINAL.py filename --inputFile2 filename2 --inputFile3 filename3 --inputFile4 filename4 / |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
15 # --output_csv csvFileName --output_pdf pdfFileName --sep "characterWhichSeparatesCSVFile" |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
16 |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
17 import numpy |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
18 import matplotlib.pyplot as plt |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
19 from matplotlib.backends.backend_pdf import PdfPages |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
20 import argparse |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
21 import sys |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
22 import os |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
23 import re |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
24 from Cheetah.Template import Template |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
25 |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
def readFileReferenceFree(file):
    """Read a tab-separated text file into a numpy array of strings.

    The file is parsed with ``numpy.genfromtxt`` using a tab delimiter and
    no skipped header lines; text following a ``#`` is treated as a comment.

    :param file: path of the tabular file to read.
    :return: the array of string fields produced by ``numpy.genfromtxt``.
    """
    with open(file, 'r') as dest_f:
        # dtype=str instead of the alias 'string': the alias only exists in
        # Python 2 builds of numpy and raises a TypeError on Python 3.
        data_array = numpy.genfromtxt(dest_f, skip_header=0, delimiter='\t',
                                      comments='#', dtype=str)
    return data_array
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
30 |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
def make_argparser():
    """Build the command line parser of the family size distribution tool.

    Arguments defined:
      * ``inputFile`` (positional) and the optional ``--inputFile2`` to
        ``--inputFile4`` (default ``None``): the tabular input files.
      * ``--inputName1`` to ``--inputName4``: names for the input files.
      * ``--sep``: separator used in the CSV output (default ``","``).
      * ``--output_csv`` / ``--output_pdf``: names of the output files
        (defaults ``data.csv`` and ``data.pdf``).

    :return: the configured ``argparse.ArgumentParser``.
    """
    input_help = 'Tabular File with three columns: ab or ba, tag and family size.'
    name_help = 'Name of input file {} that is shown in the plot.'

    parser = argparse.ArgumentParser(description='Family Size Distribution of duplex sequencing data')
    parser.add_argument('inputFile', help=input_help)
    parser.add_argument('--inputName1', help=name_help.format(1))
    # The three optional inputs are declared identically, so build them in a loop.
    for index in (2, 3, 4):
        parser.add_argument('--inputFile{}'.format(index), default=None, help=input_help)
        parser.add_argument('--inputName{}'.format(index), help=name_help.format(index))
    parser.add_argument('--sep', default=",",
                        help='Separator in the csv file.')
    # Each output option gets its own help text instead of a shared one.
    parser.add_argument('--output_csv', default="data.csv", type=str,
                        help='Name of the csv file.')
    parser.add_argument('--output_pdf', default="data.pdf", type=str,
                        help='Name of the pdf file.')
    return parser
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
52 |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
53 def compare_read_families(argv): |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
54 parser = make_argparser() |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
55 args=parser.parse_args(argv[1:]) |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
56 |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
57 firstFile = args.inputFile |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
58 name1 = args.inputName1 |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
59 secondFile = args.inputFile2 |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
60 name2 = args.inputName2 |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
61 thirdFile = args.inputFile3 |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
62 name3 = args.inputName3 |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
63 fourthFile = args.inputFile4 |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
64 name4 = args.inputName4 |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
65 |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
66 title_file = args.output_csv |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
67 title_file2 = args.output_pdf |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
68 sep = args.sep |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
69 |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
70 if type(sep) is not str or len(sep)>1: |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
71 print("Error: --sep must be a single character.") |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
72 exit(4) |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
73 |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
74 plt.rc('figure', figsize=(11.69, 8.27)) # A4 format |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
75 plt.rcParams['patch.edgecolor'] = "black" |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
76 plt.rcParams['axes.facecolor'] = "E0E0E0" # grey background color |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
77 plt.rcParams['xtick.labelsize'] = 12 |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
78 plt.rcParams['ytick.labelsize'] = 12 |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
79 |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
80 list_to_plot = [] |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
81 label = [] |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
82 data_array_list = [] |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
83 |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
84 with open(title_file, "w") as output_file, PdfPages(title_file2) as pdf: |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
85 fig = plt.figure() |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
86 plt.subplots_adjust(bottom=0.25) |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
87 if firstFile != str(None): |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
88 file1 = readFileReferenceFree(firstFile) |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
89 integers = numpy.array(file1[:, 0]).astype(int) ## keep original family sizes |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
90 |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
91 # for plot: replace all big family sizes by 22 |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
92 data1 = numpy.array(file1[:, 0]).astype(int) |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
93 bigFamilies = numpy.where(data1 > 20)[0] |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
94 data1[bigFamilies] = 22 |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
95 |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
96 name1 = name1.split(".tabular")[0] |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
97 list_to_plot.append(data1) |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
98 label.append(name1) |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
99 data_array_list.append(file1) |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
100 |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
101 legend = "\n\n\n{}".format(name1) |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
102 plt.text(0.1, 0.11, legend, size=12, transform=plt.gcf().transFigure) |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
103 legend1 = "singletons:\nabsolute nr.\n{:,}".format(numpy.bincount(data1)[1]) |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
104 plt.text(0.4, 0.11, legend1, size=12, transform=plt.gcf().transFigure) |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
105 |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
106 legend3 = "rel. freq\n{:.3f}".format(float(numpy.bincount(data1)[1]) / len(data1)) |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
107 plt.text(0.5, 0.11, legend3, size=12, transform=plt.gcf().transFigure) |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
108 |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
109 legend4 = "family size > 20:\nabsolute nr.\n{:,}".format( |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
110 numpy.bincount(data1)[len(numpy.bincount(data1)) - 1].astype(int)) |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
111 plt.text(0.6, 0.11, legend4, size=12, transform=plt.gcf().transFigure) |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
112 |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
113 legend5 = "rel. freq\n{:.3f}".format(float(numpy.bincount(data1)[len(numpy.bincount(data1)) - 1]) / len(data1)) |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
114 plt.text(0.7, 0.11, legend5, size=12, transform=plt.gcf().transFigure) |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
115 |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
116 legend6 = "total length\n{:,}".format(len(data1)) |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
117 plt.text(0.8, 0.11, legend6, size=12, transform=plt.gcf().transFigure) |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
118 |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
119 if secondFile != str(None): |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
120 file2 = readFileReferenceFree(secondFile) |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
121 data2 = numpy.asarray(file2[:, 0]).astype(int) |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
122 bigFamilies2 = numpy.where(data2 > 20)[0] |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
123 data2[bigFamilies2] = 22 |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
124 |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
125 list_to_plot.append(data2) |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
126 name2 = name2.split(".tabular")[0] |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
127 label.append(name2) |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
128 data_array_list.append(file2) |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
129 |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
130 plt.text(0.1, 0.09, name2, size=12, transform=plt.gcf().transFigure) |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
131 |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
132 legend1 = "{:,}".format(numpy.bincount(data2)[1]) |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
133 plt.text(0.4, 0.09, legend1, size=12, transform=plt.gcf().transFigure) |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
134 |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
135 legend3 = "{:.3f}".format(float(numpy.bincount(data2)[1]) / len(data2)) |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
136 plt.text(0.5, 0.09, legend3, size=12, transform=plt.gcf().transFigure) |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
137 |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
138 legend4 = "{:,}".format(numpy.bincount(data2)[len(numpy.bincount(data2)) - 1].astype(int)) |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
139 plt.text(0.6, 0.09, legend4, size=12, transform=plt.gcf().transFigure) |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
140 |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
141 legend5 = "{:.3f}".format(float(numpy.bincount(data2)[len(numpy.bincount(data2)) - 1]) / len(data2)) |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
142 plt.text(0.7, 0.09, legend5, size=12, transform=plt.gcf().transFigure) |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
143 |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
144 legend6 = "{:,}".format(len(data2)) |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
145 plt.text(0.8, 0.09, legend6, size=12, transform=plt.gcf().transFigure) |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
146 |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
147 if thirdFile != str(None): |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
148 file3 = readFileReferenceFree(thirdFile) |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
149 |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
150 data3 = numpy.asarray(file3[:, 0]).astype(int) |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
151 bigFamilies3 = numpy.where(data3 > 20)[0] |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
152 data3[bigFamilies3] = 22 |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
153 |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
154 list_to_plot.append(data3) |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
155 name3 = name3.split(".tabular")[0] |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
156 label.append(name3) |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
157 data_array_list.append(file3) |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
158 |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
159 plt.text(0.1, 0.07, name3, size=12, transform=plt.gcf().transFigure) |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
160 |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
161 legend1 = "{:,}".format(numpy.bincount(data3)[1]) |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
162 plt.text(0.4, 0.07, legend1, size=12, transform=plt.gcf().transFigure) |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
163 |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
164 legend3 = "{:.3f}".format(float(numpy.bincount(data3)[1]) / len(data3)) |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
165 plt.text(0.5, 0.07, legend3, size=12, transform=plt.gcf().transFigure) |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
166 |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
167 legend4 = "{:,}".format(numpy.bincount(data3)[len(numpy.bincount(data3)) - 1].astype(int)) |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
168 plt.text(0.6, 0.07, legend4, size=12, transform=plt.gcf().transFigure) |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
169 |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
170 legend5 = "{:.3f}".format(float(numpy.bincount(data3)[len(numpy.bincount(data3)) - 1]) / len(data3)) |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
171 plt.text(0.7, 0.07, legend5, size=12, transform=plt.gcf().transFigure) |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
172 |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
173 legend6 = "{:,}".format(len(data3)) |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
174 plt.text(0.8, 0.07, legend6, size=12, transform=plt.gcf().transFigure) |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
175 |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
176 if fourthFile != str(None): |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
177 file4 = readFileReferenceFree(fourthFile) |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
178 |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
179 data4 = numpy.asarray(file4[:, 0]).astype(int) |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
180 bigFamilies4 = numpy.where(data4 > 20)[0] |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
181 data4[bigFamilies4] = 22 |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
182 |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
183 list_to_plot.append(data4) |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
184 name4 = name4.split(".tabular")[0] |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
185 label.append(name4) |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
186 data_array_list.append(file4) |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
187 |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
188 plt.text(0.1, 0.05, name4, size=12, transform=plt.gcf().transFigure) |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
189 |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
190 legend1 = "{:,}".format(numpy.bincount(data4)[1]) |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
191 plt.text(0.4, 0.05, legend1, size=12, transform=plt.gcf().transFigure) |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
192 |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
193 legend4 = "{:.3f}".format(float(numpy.bincount(data4)[1]) / len(data4)) |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
194 plt.text(0.5, 0.05, legend4, size=12, transform=plt.gcf().transFigure) |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
195 |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
196 legend4 = "{:,}".format(numpy.bincount(data4)[len(numpy.bincount(data4)) - 1].astype(int)) |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
197 plt.text(0.6, 0.05, legend4, size=12, transform=plt.gcf().transFigure) |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
198 |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
199 legend5 = "{:.3f}".format(float(numpy.bincount(data4)[len(numpy.bincount(data4)) - 1]) / len(data4)) |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
200 plt.text(0.7, 0.05, legend5, size=12, transform=plt.gcf().transFigure) |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
201 |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
202 legend6 = "{:,}".format(len(data4)) |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
203 plt.text(0.8, 0.05, legend6, size=12, transform=plt.gcf().transFigure) |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
204 |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
205 maximumX = numpy.amax(numpy.concatenate(list_to_plot)) |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
206 minimumX = numpy.amin(numpy.concatenate(list_to_plot)) |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
207 |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
208 counts = plt.hist(list_to_plot, bins=range(minimumX, maximumX + 1), stacked=False, edgecolor="black", |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
209 linewidth=1, label=label, align="left", alpha=0.7, rwidth=0.8) |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
210 |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
211 ticks = numpy.arange(minimumX - 1, maximumX, 1) |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
212 ticks1 = map(str, ticks) |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
213 ticks1[len(ticks1) - 1] = ">20" |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
214 plt.xticks(numpy.array(ticks), ticks1) |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
215 |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
216 plt.legend(loc='upper right', fontsize=14, frameon=True, bbox_to_anchor=(0.9, 1)) |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
217 plt.title("Family Size Distribution", fontsize=14) |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
218 plt.xlabel("No. of Family Members", fontsize=14) |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
219 plt.ylabel("Absolute Frequency", fontsize=14) |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
220 plt.margins(0.01, None) |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
221 plt.grid(b=True, which="major", color="#424242", linestyle=":") |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
222 pdf.savefig(fig) |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
223 plt.close() |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
224 |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
225 # write data to CSV file |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
226 output_file.write("Values from family size distribution with all datasets\n") |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
227 output_file.write("\nFamily size") |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
228 for i in label: |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
229 output_file.write("{}{}".format(sep, i)) |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
230 output_file.write("{}sum".format(sep)) |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
231 output_file.write("\n") |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
232 j = 0 |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
233 for fs in counts[1][0:len(counts[1]) - 1]: |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
234 if fs == 21: |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
235 fs = ">20" |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
236 else: |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
237 fs = "={}".format(fs) |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
238 output_file.write("FS{}{}".format(fs, sep)) |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
239 values_of_fs = [] |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
240 if len(label) == 1: |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
241 output_file.write("{}{}".format(int(counts[0][j]), sep)) |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
242 values_of_fs.append(int(counts[0][j])) |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
243 else: |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
244 for n in range(len(label)): |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
245 output_file.write("{}{}".format(int(counts[0][n][j]), sep)) |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
246 values_of_fs.append(int(counts[0][n][j])) |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
247 output_file.write("{}\n".format(sum(values_of_fs))) |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
248 j += 1 |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
249 output_file.write("sum{}".format(sep)) |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
250 values_for_sum = [] |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
251 if len(label) == 1: |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
252 output_file.write("{}{}".format(int(sum(counts[0])), sep)) |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
253 values_for_sum.append(int(sum(counts[0]))) |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
254 else: |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
255 for i in counts[0]: |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
256 output_file.write("{}{}".format(int(sum(i)), sep)) |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
257 values_for_sum.append(int(sum(i))) |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
258 |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
259 output_file.write("{}\n".format(sum(values_for_sum))) |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
260 |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
261 ### Family size distribution after DCS and SSCS |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
262 for dataset, data, name_file in zip(list_to_plot, data_array_list, label): |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
263 maximumX = numpy.amax(dataset) |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
264 minimumX = numpy.amin(dataset) |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
265 |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
266 tags = numpy.array(data[:, 2]) |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
267 seq = numpy.array(data[:, 1]) |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
268 data = numpy.array(dataset) |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
269 |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
270 # find all unique tags and get the indices for ALL tags, but only once |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
271 u, index_unique, c = numpy.unique(numpy.array(seq), return_counts=True, return_index=True) |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
272 d = u[c > 1] |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
273 |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
274 # get family sizes, tag for duplicates |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
275 duplTags_double = data[numpy.in1d(seq, d)] |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
276 duplTags = duplTags_double[0::2] # ab of DCS |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
277 duplTagsBA = duplTags_double[1::2] # ba of DCS |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
278 |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
279 duplTags_double_tag = tags[numpy.in1d(seq, d)] |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
280 duplTags_double_seq = seq[numpy.in1d(seq, d)] |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
281 |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
282 # get family sizes for SSCS with no partner |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
283 ab = numpy.where(tags == "ab")[0] |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
284 abSeq = seq[ab] |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
285 ab = data[ab] |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
286 ba = numpy.where(tags == "ba")[0] |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
287 baSeq = seq[ba] |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
288 ba = data[ba] |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
289 |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
290 dataAB = ab[numpy.in1d(abSeq, d, invert=True)] |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
291 dataBA = ba[numpy.in1d(baSeq, d, invert=True)] |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
292 |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
293 # write DCS tags to file |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
294 # with open("DCS information_{}.txt".format(firstFile), "w") as file: |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
295 # for t, s, f in zip(duplTags_double_tag, duplTags_double_seq, duplTags_double): |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
296 # file.write("{}\t{}\t{}\n".format(t, s, f)) |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
297 |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
298 list1 = [duplTags_double, dataAB, dataBA] # list for plotting |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
299 |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
300 ## information for family size >= 3 |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
301 dataAB_FS3 = dataAB[dataAB >= 3] |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
302 dataBA_FS3 = dataBA[dataBA >= 3] |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
303 ab_FS3 = ab[ab >= 3] |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
304 ba_FS3 = ba[ba >= 3] |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
305 |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
306 duplTags_FS3 = duplTags[(duplTags >= 3) & (duplTagsBA >= 3)] # ab+ba with FS>=3 |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
307 duplTags_FS3_BA = duplTagsBA[(duplTags >= 3) & (duplTagsBA >= 3)] # ba+ab with FS>=3 |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
308 duplTags_double_FS3 = len(duplTags_FS3)+len(duplTags_FS3_BA) # both ab and ba strands with FS>=3 |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
309 |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
310 fig = plt.figure() |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
311 |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
312 plt.subplots_adjust(bottom=0.3) |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
313 counts = plt.hist(list1, bins=range(minimumX, maximumX + 1), stacked=True, |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
314 label=["duplex", "ab", "ba"], edgecolor="black", linewidth=1, |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
315 align="left", color=["#FF0000", "#5FB404", "#FFBF00"]) |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
316 # tick labels of x axis |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
317 ticks = numpy.arange(minimumX - 1, maximumX, 1) |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
318 ticks1 = map(str, ticks) |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
319 ticks1[len(ticks1) - 1] = ">20" |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
320 plt.xticks(numpy.array(ticks), ticks1) |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
321 singl = counts[0][2][0] # singletons |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
322 last = counts[0][2][len(counts[0][0]) - 1] # large families |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
323 |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
324 plt.legend(loc='upper right', fontsize=14, bbox_to_anchor=(0.9, 1), frameon=True) |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
325 plt.title(name1, fontsize=14) |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
326 plt.xlabel("No. of Family Members", fontsize=14) |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
327 plt.ylabel("Absolute Frequency", fontsize=14) |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
328 plt.margins(0.01, None) |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
329 plt.grid(b=True, which="major", color="#424242", linestyle=":") |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
330 |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
331 ## extra information beneath the plot |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
332 legend = "SSCS ab= \nSSCS ba= \nDCS (total)= \nlength of dataset=" |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
333 plt.text(0.1, 0.09, legend, size=12, transform=plt.gcf().transFigure) |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
334 |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
335 legend = "absolute numbers\n\n{:,}\n{:,}\n{:,} ({:,})\n{:,}" \ |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
336 .format(len(dataAB), len(dataBA), len(duplTags), len(duplTags_double), |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
337 (len(dataAB) + len(dataBA) + len(duplTags))) |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
338 plt.text(0.35, 0.09, legend, size=12, transform=plt.gcf().transFigure) |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
339 |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
340 legend = "relative frequencies\nunique\n{:.3f}\n{:.3f}\n{:.3f}\n{:,}" \ |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
341 .format(float(len(dataAB)) / (len(dataAB) + len(dataBA) + len(duplTags)), |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
342 float(len(dataBA)) / (len(dataAB) + len(dataBA) + len(duplTags)), |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
343 float(len(duplTags)) / (len(dataAB) + len(dataBA) + len(duplTags)), |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
344 (len(dataAB) + len(dataBA) + len(duplTags))) |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
345 plt.text(0.54, 0.09, legend, size=12, transform=plt.gcf().transFigure) |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
346 |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
347 legend = "total\n{:.3f}\n{:.3f}\n{:.3f} ({:.3f})\n{:,}" \ |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
348 .format(float(len(dataAB)) / (len(ab) + len(ba)), float(len(dataBA)) / (len(ab) + len(ba)), |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
349 float(len(duplTags)) / (len(ab) + len(ba)), |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
350 float(len(duplTags_double)) / (len(ab) + len(ba)), (len(ab) + len(ba))) |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
351 plt.text(0.64, 0.09, legend, size=12, transform=plt.gcf().transFigure) |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
352 |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
353 legend1 = "\nsingletons:\nfamily size > 20:" |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
354 plt.text(0.1, 0.03, legend1, size=12, transform=plt.gcf().transFigure) |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
355 |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
356 legend4 = "{:,}\n{:,}".format(singl.astype(int), last.astype(int)) |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
357 plt.text(0.35, 0.03, legend4, size=12, transform=plt.gcf().transFigure) |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
358 |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
359 legend3 = "{:.3f}\n{:.3f}".format(singl / len(data),last / len(data)) |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
360 plt.text(0.54, 0.03, legend3, size=12, transform=plt.gcf().transFigure) |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
361 |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
362 pdf.savefig(fig) |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
363 plt.close() |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
364 |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
365 # write same information to a csv file |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
366 count = numpy.bincount(integers) # original counts of family sizes |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
367 output_file.write("\nDataset:{}{}\n".format(sep, name_file)) |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
368 output_file.write("max. family size:{}{}\n".format(sep, max(integers))) |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
369 output_file.write("absolute frequency:{}{}\n".format(sep, count[len(count) - 1])) |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
370 output_file.write("relative frequency:{}{:.3f}\n\n".format(sep, float(count[len(count) - 1]) / sum(count))) |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
371 |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
372 output_file.write("{}singletons:{}{}family size > 20:\n".format(sep, sep, sep)) |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
373 output_file.write( |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
374 "{}absolute nr.{}rel. freq{}absolute nr.{}rel. freq{}total length\n".format(sep, sep, sep, sep, sep)) |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
375 output_file.write("{}{}{}{}{:.3f}{}{}{}{:.3f}{}{}\n\n".format(name_file, sep, singl.astype(int), sep, |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
376 singl / len(data), sep,last.astype(int), sep, |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
377 last / len(data), sep, len(data))) |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
378 |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
379 ## information for FS >= 1 |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
380 output_file.write( |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
381 "The unique frequencies were calculated from the dataset where the tags occured only once (=ab without DCS, ba without DCS)\n" \ |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
382 "Whereas the total frequencies were calculated from the whole dataset (=including the DCS).\n\n") |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
383 output_file.write("FS >= 1{}{}unique:{}total:\n".format(sep, sep, sep)) |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
384 output_file.write("nr./rel. freq of ab={}{}{}{:.3f}{}{:.3f}\n".format(sep, len(dataAB), sep, |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
385 float(len(dataAB)) / (len(dataAB) + len(dataBA) + len( duplTags)), sep, |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
386 float(len(dataAB)) / (len(ab) + len(ba)))) |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
387 output_file.write("nr./rel. freq of ba={}{}{}{:.3f}{}{:.3f}\n".format(sep, len(dataBA), sep, |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
388 float(len(dataBA)) / (len(dataBA) + len(dataBA) + len(duplTags)), sep, |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
389 float(len(dataBA)) / (len(ba) + len(ba)))) |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
390 output_file.write( |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
391 "nr./rel. freq of DCS (total)={}{} ({}){}{:.3f}{}{:.3f} ({:.3f})\n".format(sep, len(duplTags), len(duplTags_double), sep, |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
392 float(len(duplTags)) / ( len(dataAB) + len( dataBA) + len(duplTags)), |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
393 sep, float(len(duplTags)) / ( len(ab) + len(ba)), |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
394 float( len(duplTags_double)) / (len(ab) + len(ba)))) |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
395 output_file.write( |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
396 "length of dataset={}{}{}{}{}{}\n".format(sep, (len(dataAB) + len(dataBA) + len(duplTags)), sep, |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
397 (len(dataAB) + len(dataBA) + len(duplTags)), sep,(len(ab) + len(ba)))) |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
398 ## information for FS >= 3 |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
399 output_file.write("FS >= 3{}{}unique:{}total:\n".format(sep, sep, sep)) |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
400 output_file.write("nr./rel. freq of ab={}{}{}{:.3f}{}{:.3f}\n".format(sep, len(dataAB_FS3), sep, |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
401 float(len(dataAB_FS3)) / (len(dataAB_FS3) + len(dataBA_FS3) + len(duplTags_FS3)), |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
402 sep, float(len(dataAB_FS3)) / ( len(ab_FS3) + len(ba_FS3)))) |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
403 output_file.write("nr./rel. freq of ba={}{}{}{:.3f}{}{:.3f}\n".format(sep, len(dataBA_FS3), sep, |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
404 float(len(dataBA_FS3)) / ( len(dataBA_FS3) + len(dataBA_FS3) + len(duplTags_FS3)), |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
405 sep,float(len(dataBA_FS3)) / (len(ba_FS3) + len(ba_FS3)))) |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
406 output_file.write( |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
407 "nr./rel. freq of DCS (total)={}{} ({}){}{:.3f}{}{:.3f} ({:.3f})\n".format(sep, len(duplTags_FS3),duplTags_double_FS3, |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
408 sep, float(len( duplTags_FS3)) / (len(dataBA_FS3) + len(duplTags_FS3)), |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
409 sep, float(len(duplTags_FS3)) / (len(ab_FS3) + len(ba_FS3)), |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
410 float(duplTags_double_FS3) / (len(ab_FS3) + len(ba_FS3)))) |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
411 output_file.write( |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
412 "length of dataset={}{}{}{}{}{}\n".format(sep, (len(dataAB_FS3) + len(dataBA_FS3) + len(duplTags_FS3)), sep, |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
413 (len(dataAB_FS3) + len(dataBA_FS3) + len(duplTags_FS3)), sep, |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
414 (len(ab_FS3) + len(ba_FS3)))) |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
415 |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
416 output_file.write("\nValues from family size distribution\n") |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
417 output_file.write("{}duplex{}ab{}ba{}sum\n".format(sep, sep, sep, sep)) |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
418 for dx, ab, ba, fs in zip(counts[0][0], counts[0][1], counts[0][2], counts[1]): |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
419 if fs == 21: |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
420 fs = ">20" |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
421 else: |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
422 fs = "={}".format(fs) |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
423 ab1 = ab - dx |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
424 ba1 = ba - ab |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
425 output_file.write( |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
426 "FS{}{}{}{}{}{}{}{}{}\n".format(fs, sep, int(dx), sep, int(ab1), sep, int(ba1), sep, int(ba))) |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
427 |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
428 print("Files successfully created!") |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
429 |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
430 if __name__ == '__main__': |
9736b9d04a0b
planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd commit f674213e798956531c935e7b9eb7f444286d0a5e-dirty
mheinzl
parents:
diff
changeset
|
431 sys.exit(compare_read_families(sys.argv)) |