changeset 4:3288cc5a57e5 draft

planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/master/tools/blast_to_scaffold commit fb47b9859a0703f1fa4a1e76b75b9dae29ca8329
author drosofff
date Fri, 25 Mar 2016 19:21:26 -0400
parents e279e53a3fde
children 81ffa74cf96e
files blast_to_scaffold.py blast_to_scaffold.xml test-data/assembly.fa
diffstat 3 files changed, 14 insertions(+), 8 deletions(-) [+]
line wrap: on
line diff
--- a/blast_to_scaffold.py	Fri Mar 25 19:14:20 2016 -0400
+++ b/blast_to_scaffold.py	Fri Mar 25 19:21:26 2016 -0400
@@ -30,6 +30,10 @@
         '--blast-tab', dest="blast_tab", action="store", type=str, help="13-columns tabular blastn or tblastx output")
     the_parser.add_argument(
         '--output', action="store", type=str, help="output file path, fasta format")
+    the_parser.add_argument(
+        '--scaffold_prefix', action="store", type=str, help="the prefix that will be used for the header of the fasta scaffold")
+    the_parser.add_argument(
+        '--scaffold_suffix', action="store", type=str, help="the sufix that will be used for the header of the fasta scaffold")
     args = the_parser.parse_args()
     return args
     
@@ -98,13 +102,13 @@
         for i, nucleotide in enumerate(sequence):
             GuideDict[i+subjectStart] = nucleotide
             
-def finalAssembly (GuideDict, outputfile):
+def finalAssembly (GuideDict, outputfile, prefix, suffix):
     finalSeqList = []
     for keys in sorted(GuideDict):
         finalSeqList.append(GuideDict[keys])
     finalSequence = insert_newlines("".join(finalSeqList) )
     Out = open (outputfile, "w")
-    print >> Out, ">Scaffold"
+    print >> Out, ">Scaffold_from_%s_guided_by_%s" % (prefix, suffix)
     print >> Out, finalSequence
     Out.close()
     
@@ -114,7 +118,7 @@
     GuideDict = myGuide (args.guideSequence)
     blastlist = blatnInfo(args.blast_tab)
     updateGuide(blastlist, GuideDict, ContigsDict)
-    finalAssembly(GuideDict, args.output)
+    finalAssembly(GuideDict, args.output, args.scaffold_prefix, args.scaffold_suffix)
 
 if __name__ == "__main__":
     __main__()
--- a/blast_to_scaffold.xml	Fri Mar 25 19:14:20 2016 -0400
+++ b/blast_to_scaffold.xml	Fri Mar 25 19:21:26 2016 -0400
@@ -1,12 +1,14 @@
-<tool id="blast2scaffold" name="blast_to_scaffold" version="0.1.0">
+<tool id="blast2scaffold" name="blast_to_scaffold" version="0.9.0">
 <description>Generate DNA scaffold from blastn or tblastx alignment of Contigs</description>
 <requirements>
 </requirements>
 <command interpreter="python">
         blast_to_scaffold.py --sequences "$sequences"
-                              --guideSequence "$guideSequence"
-                              --blast-tab "$blast_tab"
-                              --output "$output"
+                             --guideSequence "$guideSequence"
+                             --blast-tab "$blast_tab"
+                             --output "$output"
+                             --scaffold_prefix "$sequences.element_identifier"
+                             --scaffold_suffix "$guideSequence.element_identifier"
 </command>
 <inputs>
 <param name="sequences" type="data" format="fasta" label="Select a fasta contigs file"/> 
--- a/test-data/assembly.fa	Fri Mar 25 19:14:20 2016 -0400
+++ b/test-data/assembly.fa	Fri Mar 25 19:21:26 2016 -0400
@@ -1,4 +1,4 @@
->Scaffold
+>Scaffold_from_contigs.fa_guided_by_guideSequence.fa
 gcaaaaaggcccctgggGGGGGGTTAATGAGTACTGGAAAAAGAAGCGCGAGATACCACT
 TCGCTGATTATGCTGATTCTGGTATTAAGGATTAGTAGAGTATCGGAAGTGCCGAAGGGA
 ATAATGCTGGTCCGTTGTAAACAGGATACTTATGAGACCTCTTAACAGAAACTTTGAGCA