# view PDAUG_Peptide_Length_Distribution/PDAUG_Peptide_Length_Distribution.py @ 4:87b77f2ddb0c draft

# "planemo upload for repository https://github.com/jaidevjoshi83/pdaug commit 8b18552f6d2b2261efebe1075ff4c18a295b94dd"
# author jay
# date Tue, 29 Dec 2020 18:13:00 +0000
# parents c3f0b3a6339e
# children
# line wrap: on
# line source

import matplotlib.pyplot as plt
import Bio
from Bio import SeqIO
import os


def LegnthDestribution(InFile, OutFile):
    """Plot a histogram of sequence lengths from a FASTA file and save it.

    Every record parsed from ``InFile`` contributes one length value; the
    lengths are binned into 20 bins and the resulting figure is written to
    ``OutFile``.

    Args:
        InFile: FASTA input, passed unchanged to ``SeqIO.parse``.
        OutFile: Destination of the plot, passed unchanged to ``savefig``.

    Raises:
        ValueError: If ``InFile`` yields no sequence records.
    """
    sizes = [len(rec.seq) for rec in SeqIO.parse(InFile, "fasta")]

    # Fail early with an explicit message; otherwise min()/max() below would
    # raise an opaque "arg is an empty sequence" ValueError.
    if not sizes:
        raise ValueError(
            "No sequences found in %r; cannot plot a length distribution"
            % (InFile,)
        )

    # Use a dedicated figure rather than pyplot's implicit global one so that
    # repeated calls do not draw on top of each other.
    fig, ax = plt.subplots()
    try:
        ax.hist(sizes, bins=20)
        # NOTE(review): the title wording and the "(bp)" unit are hard-coded
        # and kept as-is so the rendered output stays unchanged.
        ax.set_title("%i Negative bacteriocin sequences\nLengths %i to %i"
                     % (len(sizes), min(sizes), max(sizes)))
        ax.set_xlabel("Sequence length (bp)")
        ax.set_ylabel("Count")

        fig.savefig(OutFile)
    finally:
        # Always release the figure, even if drawing or saving fails.
        plt.close(fig)



if __name__ == "__main__":
    # Command-line entry point: parse the input/output paths and render the
    # length-distribution plot.
    import argparse

    parser = argparse.ArgumentParser()

    # The input FASTA file is mandatory, so no default is needed.
    parser.add_argument("-I", "--InFile", required=True, help="Input file name")
    # The output image path is optional and falls back to "Out.png".
    parser.add_argument("-O", "--OutFile", required=False, default="Out.png", help="Output file name")
    args = parser.parse_args()
    LegnthDestribution(args.InFile, args.OutFile)