fsd_bvsa: fsd_beforevsafter.py comparison

comparison fsd_beforevsafter.py @ 2:e8115b71edbd draft

planemo upload for repository https://github.com/monikaheinzl/galaxyProject/tree/master/tools/fsd_beforevsafter commit b9403b3ce2b7a41fa8ee1aa47909152de78cf641

author	mheinzl
date	Tue, 15 May 2018 13:50:02 -0400
parents	6716b1cddf3e
children	327c40a821ed

comparison

equal deleted inserted replaced

-:6ed6dca9488f
+:e8115b71edbd
 # a TABULAR file with tags before the alignment to the SSCS, a FASTA file with reads that were part of the DCS and
 # a FASTA file with tags after trimming as input (optional).
 # The program produces a plot which shows the distribution of family sizes of the DCS from the input files and
 # a CSV file with the data of the plot.
-# USAGE: python FSD before vs after_no_refF1.3_FINAL.py --inputFile_SSCS filenameSSCS --makeDCS filenameMakeDCS --afterTrimming filenameAfterTrimming -- alignedTags filenameTagsRefGenome
+# USAGE: python fsd_beforevsafter.py --inputFile_SSCS filenameSSCS --inputName1 filenameSSCS --makeDCS filenameMakeDCS --afterTrimming filenameAfterTrimming --alignedTags filenameTagsRefGenome
 # --sep "characterWhichSeparatesCSVFile" --output_csv outputfile_name_csv --output_pdf outputfile_name_pdf
 import numpy
 import matplotlib.pyplot as plt
 def make_argparser():
 parser = argparse.ArgumentParser(description='Analysis of read loss in duplex sequencing data')
 parser.add_argument('--inputFile_SSCS',
 help='Tabular File with three columns: ab or ba, tag and family size.')
+parser.add_argument('--inputName1')
 parser.add_argument('--makeDCS',
 help='FASTA File with information about tag and family size in the header.')
 parser.add_argument('--afterTrimming',default=None,
 help='FASTA File with information about tag and family size in the header.')
 parser.add_argument('--alignedTags',default=None,
 def compare_read_families_read_loss(argv):
 parser = make_argparser()
 args = parser.parse_args(argv[1:])
 SSCS_file = args.inputFile_SSCS
+SSCS_file_name = args.inputName1
 makeConsensus = args.makeDCS
 afterTrimming = args.afterTrimming
 ref_genome = args.alignedTags
 title_file = args.output_csv
 title_file2 = args.output_pdf
 with open(title_file, "w") as output_file, PdfPages(title_file2) as pdf:
 ### PLOT ###
 plt.rc('figure', figsize=(11.69, 8.27))  # A4 format
 plt.rcParams['axes.facecolor'] = "E0E0E0"  # grey background color
-plt.rcParams['xtick.labelsize'] = 12
+plt.rcParams['xtick.labelsize'] = 14
-plt.rcParams['ytick.labelsize'] = 12
+plt.rcParams['ytick.labelsize'] = 14
 plt.rcParams['patch.edgecolor'] = "black"
 fig = plt.figure()
 plt.subplots_adjust(bottom=0.3)
 list1 = []
 legend4 = "* In the plot, the family sizes of ab and ba strands and of both duplex tags were used.\nWhereas the total numbers indicate only the single count of the formed duplex tags."
 plt.text(0.1, 0.02, legend4, size=11, transform=plt.gcf().transFigure)
 plt.legend(loc='upper right', fontsize=14, bbox_to_anchor=(0.9, 1), frameon=True)
-plt.title("Family Size Distribution of Tags from various Steps of the Galaxy Pipeline", fontsize=14)
+plt.title("Family size distribution of tags from various steps of the Du Novo pipeline", fontsize=14)
-plt.xlabel("No. of Family Members", fontsize=12)
+plt.xlabel("Family size", fontsize=14)
-plt.ylabel("Absolute Frequency", fontsize=12)
+plt.ylabel("Absolute Frequency", fontsize=14)
 plt.grid(b=True, which="major", color="#424242", linestyle=":")
 plt.margins(0.01, None)
 pdf.savefig(fig, bbox_inch="tight")
 plt.close()
 # write information about plot into a csv file
-output_file.write("Dataset:{}{}\n".format(sep, SSCS_file))
+output_file.write("Dataset:{}{}\n".format(sep, SSCS_file_name))
 if ref_genome != str(None):
 output_file.write("{}AB{}BA\n".format(sep, sep))
 output_file.write("max. family size:{}{}{}{}\n".format(sep, max(quant_ab_ref), sep, max(quant_ba_ref)))
 output_file.write(
 "absolute frequency:{}{}{}{}\n".format(sep, count[len(count) - 1], sep, count2[len(count2) - 1]))

Mercurial > repos > mheinzl > fsd_bvsa

comparison fsd_beforevsafter.py @ 2:e8115b71edbd draft