changeset 3:039547ad8fb8 draft

planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/segemehl commit 21aaee40723b5341b4236edeb0e72995c2054053
author rnateam
date Fri, 16 Dec 2016 07:37:24 -0500
parents 0da425524259
children db367d012fa3
files segemehl.tar.gz segemehl.xml test-data/chr1.fa test-data/chr1.idx test-data/test.fastq test-data/testmap.sam tool_dependencies.xml
diffstat 7 files changed, 147 insertions(+), 33 deletions(-) [+]
line wrap: on
line diff
Binary file segemehl.tar.gz has changed
--- a/segemehl.xml	Thu Feb 05 08:25:13 2015 -0500
+++ b/segemehl.xml	Fri Dec 16 07:37:24 2016 -0500
@@ -1,14 +1,21 @@
-<tool id="segemehl" name="segemehl" version="0.1.6.0">
+<tool id="segemehl" name="segemehl" version="0.2.0">
     <description>based short read aligner</description>
     <requirements>
-        <requirement type="package" version="0.1.6">segemehl</requirement>
+        <requirement type="package" version="0.2.0">segemehl</requirement>
     </requirements>
+    <stdio>
+        <regex match="Exit forced"
+           source="both"
+           level="fatal"
+           description="Execution halted." />
+    </stdio>
     <command>
 <![CDATA[
         ## prepare segemehl index if no reference genome is supplied
-        temp_index = `mktemp`;
         #if $refGenomeSource.genomeSource == "history":
-            segemehl.x -x $temp_index -d $refGenomeSource.own_reference_genome;
+            mkdir ./temp_index/ &&
+	    #set $temp_index = './temp_index/temp.idx'
+	    segemehl.x -x $temp_index -d $refGenomeSource.own_reference_genome &&
         #else:
             #set $temp_index = $refGenomeSource.index.fields.index_path
         #end if
@@ -20,8 +27,11 @@
         ## number of threads
         -t "\${GALAXY_SLOTS:-12}"
 
-        ## db file path
-        -d ${refGenomeSource.index.fields.db_path}
+        #if $refGenomeSource.genomeSource == "history":
+	    -d $refGenomeSource.own_reference_genome
+        #else:
+            -d ${refGenomeSource.index.fields.db_path}
+        #end if
 
         -i $temp_index
 
@@ -29,8 +39,8 @@
         #if str( $library.type ) == "single":
             #set $query_list = list()
             ## prepare inputs
-            #for $fastq in $library.reads:
-                $query_list.append('%s' %($fastq.input_query))
+            #for $fastq in $library.input_query:
+                $query_list.append('%s' % $fastq )
             #end for
             -q "#echo ' '.join( $query_list )#"
         #else
@@ -61,18 +71,21 @@
         $autoclip
         $hardclip
         $order
+	$splits
+        #if $maxout:
+            --maxout $maxout
+        #end if
         -s
-        -o $segemehl_out
+
+        --minsplicecover $minsplicecover
+        --minfragscore $minfragscore
+        --minfraglen $minfraglen
+        --splicescorescale $splicescorescale
+
+        -o '$segemehl_out'
 ]]>
     </command>
-    <stdio>
-        <regex match="Exit forced"
-           source="both"
-           level="fatal"
-           description="Execution halted." />
-    </stdio>
     <inputs>
-
         <conditional name="refGenomeSource">
           <param name="genomeSource" type="select" label="Will you select a reference genome from your history or use a built-in index?" help="Built-ins were indexed using default options">
             <option value="indexed">Use a built-in index</option>
@@ -92,22 +105,20 @@
             </param>
           </when>  <!-- build-in -->
           <when value="history">
-            <param name="own_reference_genome" type="data" format="fasta" metadata_name="dbkey" label="Select the reference genome" />
+              <param name="own_reference_genome" type="data" format="fasta" label="Select the reference genome" />
           </when>  <!-- history -->
         </conditional>  <!-- refGenomeSource -->
 
-
         <conditional name="library">
             <param name="type" type="select" label="Is this library paired-end?">
                 <option value="single">Single-end</option>
                 <option value="paired">Paired-end</option>
             </param>
             <when value="single">
-                <repeat name="reads" title="FASTQ/FASTA files">
-                    <param name="input_query" type="data" format="fastqsanger,fastqillumina,fastq,fasta" label="Reads fasta/fastq file" />
-                </repeat>
+                <param name="input_query" type="data" multiple="True" format="fastqsanger,fastqillumina,fastq,fasta" label="Reads in FASTQ/FASTA files" />
             </when>
             <when value="paired">
+                <!-- ToDo paired coolections -->
                 <repeat name="mate_list" title="Paired End Pairs" min="1">
                     <param name="first_strand_query" type="data" format="fastqsanger,fastqillumina,fastq,fasta" label="Reads from first strand" />
                     <param name="second_strand_query" type="data" format="fastqsanger,fastqillumina,fastq,fasta" label="Reads from second strand" />
@@ -116,28 +127,43 @@
             </when>
         </conditional>
 
+        <param name="minsplicecover" type="integer" value="80" label="Min coverage for spliced transcripts" help="(--minsplicecover)" />
+        <param name="minfragscore" type="integer" value="18" label="Min coverage for spliced transcripts" help="(--minfragscore)" />
+        <param name="minfraglen" type="integer" value="20" label="Min length of a spliced fragment" help="(--minfraglen)" />
+        <param name="splicescorescale" type="float" value="1.0" label="Report spliced alignment with score greater than this scale times the score"
+            help="Report only if this value x score is larger than next best spliced alignment (--splicescorescale)" />
 
-        <param name="minsize" type="integer" value="12" size="5" label="Minimum size of queries" help="default: 12 (-m)">
-            <validator type="in_range" min="1"/>
-        </param>
-        <param name="accuracy" type="integer" value="85" size="5" label="Min percentage of matches per read in semi-global alignment" help="default: 85 (-A)" >
-            <validator type="in_range" min="1" max="100"/>
-        </param>
+        <param name="minsize" type="integer" value="12" min="1" label="Minimum size of queries" help="(-m)" />
+
+        <param name="maxout" type="integer" min="0" value="0" optional="True" 
+            label="Maximum number of alignments that will be reported" help="(--maxout)" />
+        <param name="accuracy" type="integer" value="85" min="1" max="100" label="Min percentage of matches per read in semi-global alignment" help="(-A)" />
+
         <param name="hitstrategy" type="select" label="Hits to report?" help="(-H)">
             <option value="1">report only best scoring hits</option>
             <option value="0">report all scoring hits</option>
         </param>
-        <param name="prime5" type="text" size="80" label="add 5' adapter" help="default: none (-Q)" />
-        <param name="prime3" type="text" size="80" label="add 3' adapter" help="default: none (-P)"/>
+        <param name="prime5" type="text" label="add 5' adapter" help="default: none (-Q)" />
+        <param name="prime3" type="text" label="add 3' adapter" help="default: none (-P)"/>
         <param name="polyA" type="boolean" truevalue="--polyA" falsevalue="" checked="false" label="Clip polyA tail" help="(-T)"/>
         <param name="autoclip" type="boolean" truevalue="--autoclip" falsevalue="" checked="false" label="Autoclip unknown 3prime adapter" help="(-Y)"/>
-        <param name="hardclip" type="boolean" truevalue="--hardclip" falsevalue="" checked="false" label="Enable hard clipping" help="-C"/>
+        <param name="hardclip" type="boolean" truevalue="--hardclip" falsevalue="" checked="false" label="Enable hard clipping" help="(-C)"/>
         <param name="order" type="boolean" truevalue="--order" falsevalue="" checked="false" label="Sorts the output by chromsome and position" help="(-O)"/>
+        <param name="splits" type="boolean" truevalue="--splits" falsevalue="" checked="false" label="Detect split/spliced reads" help="(--splits)"/>
     </inputs>
-
     <outputs>
         <data format="sam" name="segemehl_out" label="Read alignments on ${on_string}"/>
     </outputs>
+    <tests>
+      <test>
+	<param name="genomeSource" value="history" />
+        <param name="own_reference_genome" value="chr1.fa" />
+	<param name="library" value="single" />
+	<param name="input_query" value="test.fastq" />	
+	<param name="splits" value="true" />
+        <output name="segemehl_out" file="testmap.sam" lines_diff="2" />
+      </test>
+    </tests>
     <help>
 <![CDATA[
 
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/chr1.fa	Fri Dec 16 07:37:24 2016 -0500
@@ -0,0 +1,59 @@
+>TestChromosomeForGalaxy
+CACTGAATTGACCCTTGGCAATGGTCTGTTCCCGCACCCAACACCTGGCTCCACTACGTT
+GAAACACACACACACACACACACACACACACACACACACACACACACACGTGATATTTGC
+TTTTAAGATCATAAAACACCAGGAAGGAGACAAAAGCTCTTATGCGTCATCTGAGATGAC
+ACATGTACTGTTAAAGCGTGCGTTTATTTCAAACATTAATGAAATTTGCAGAACCCAAAC
+TAAAGAGAGAGGATAGATAAGACATGCTGCAGTTCTTGCCCTAACTTTCAATCCCAACAA
+CTGAAATGTCTTCCAGAGAAGTAACTCCCCCCGGTAAGGATGTAGCGCGGTCCCTACGTG
+GGTCTAAGGGATCTGACCCACGACGCACTGCACTGGGTTCACGAAGCGCCTCCTCGCAGG
+CGGTTATCTCGGTATCTCTGAGAGCGGCGGGCTCTCGCTCCCGCTCCAGGGATTCGGGGC
+AGAAAGAGAACATCCCACAGTTGGCGGGAGTTACGCAAGACAGTCAGACCCGGACGTCAC
+TCGTGAGTGCCCCGACCCCCCTCCACCCCAGAGGCGGGGCCATCGCCTTCCTTCCGAACT
+CGGGATCGATCTGGAGCTCCGGGAATTTCCCTGGCCCGGGACTCCGGGCTTTCCAGCCCC
+AACCATGCATAAAAGGGGTTCGCCGTTCTCGGAGAGCCACAGAGCCCGGGCCACAGGCAG
+CTCCTTGCCAGCTCTCCTCCTCGCACAGCCGCTCGAACCGCCTGCTGAGCCCCATGGCCC
+GCGCCACGCTCTCCGCCGCCCCCAGCAATCCCCGGCTCCTGCGGGTGGCGCTGCTGCTCC
+TGCTCCTGGTGGCCGCCAGCCGGCGCGCAGCAGGTGGGTCCCGGCGCCCTGGGGTCCCCG
+GGCCGGACGCGGCTGGGGTGGGCGCCCCGCGCCGACAGCCCCGCTCAATCAGCGAGTCTC
+TTCTTCCCTAGGAGCGCCCCTGGCCACTGAACTGCGCTGCCAGTGCTTGCAGACCCTGCA
+GGGAATTCACCTCAAGAACATCCAAAGTGTGAAGGTGAAGTCCCCCGGACCCCACTGCGC
+CCAAACCGAAGTCATGTAAGTCTCGCCCATCGCTGCCGCTGCCACTGCTGGGGTCCCCGA
+CTCTCCCGCTGCCCCAAACCCTGTCCTCAGCCCGACCTCCTGTCTCACGAGATTCCCTTC
+TCTCTGCAGAGCCACACTCAAGAATGGGCAGAAAGCTTGTCTCAACCCCGCATCGCCCAT
+GGTTAAGAAAATCATCGAAAAGATGCTGAAAAAGTAAGTTATAATTTCCATGTACACAGG
+CGACTGGAGCTGTTGGTCAGAAATACTGGCGTCTGCCCCCTAAAAAGTAAATCAGGAAAA
+CCCAGGGTTAGCTGCAGGACTGAAAAAATTATTATTTTCACAAAGTTGCCATTAAGGTTA
+TTAATCTGTTCTGGTGCCAGAGGATATTCCCAGTGCCCAGGGTCACCACCCAGGTTCTTC
+CCTCCTGCCAGTGAATGTAGGTAAAACTGCTTTCATGTAAGGTCTCATTGGAGTTTGCCA
+GTTGTGCTGAAGTGTTTTCCACCTGTTAAAAAACACAAGCTTCATTTCCCCTAGTTCCTA
+CTGACTTTCAGACCTGAAAAGCAGACCCCCTGGTTTTTTGTAAAAGTTTAGGGTTGAAGT
+GCAGAGATTTCACAATAATATTGCACTGGGTATATAACTGGTTGCCACCACCTATTAGCC
+ATGTCACTCAGAGACAATATTATTTAGTTTATCTGAGACTCAGCAAAACAGGGAAAATAA
+TGGTAGCTACATCATGAGGTTGCTTTGAGGCTCAAGTGAGGCCCAGTATGACAAAGAGCA
+ATAGGCTCTGGCTGTTTTAGCCAGTAAAACAGTGTAGACTGCCACTCCTCCACCCCACGT
+CACCCCCATTCCTAAAAGAGCATCCCAAGCCTAGAGGTCCTTGCCACACAGCACAGCTGT
+CACAGGCAGTACCCACTTGGGTGCCAGGCTGGGGAAACTGCATTCAGAAAACTCTAGAGC
+CTGGGGAAACAGGACAGGAGAAGACTGTTGTGCAGTCAGCTTTCCTGAGCACCTACTCAG
+GGCACCCATTTTCTCATTACAGTGGCAAATCCAACTGACCAGAAGGAAGGAGGAAGCTTA
+TTGGTGGCTGTTCCTGAAGGAGGCCCTGCCCTTACAGGAACAGAAGAGGAAAGAGAGACA
+CAGCTGCAGAGGCCACCTGGATTGCGCCTAATGTGTTTGAGCATCACTTAGGAGAAGTCT
+TCTATTTATTTATTTATTTATTTATTTGTTTGTTTTAGAAGATTCTATGTTAATATTTTA
+TGTGTAAAATAAGGTTATGATTGAATCTACTTGCACACTCTCCCATTATATTTATTGTTT
+ATTTTAGGTCAAACCCAAGTTAGTTCAATCCTGATTCATATTTAATTTGAAGATAGAAGG
+TTTGCAGATATTCTCTAGTCATTTGTTAATATTTCTTCGTGATGACATATCACATGTCAG
+CCACTGTGATAGAGGCTGAGGAATCCAAGAAAATGGCCAGTGAGATCAATGTGACGGCAG
+GGAAATGTATGTGTGTCTATTTTGTAACTGTAAAGATGAATGTCAGTTGTTATTTATTGA
+AATGATTTCACAGTGTGTGGTCAACATTTCTCATGTTGAAGCTTTAAGAACTAAAATGTT
+CTAAATATCCCTTGGACATTTTATGTCTTTCTTGTAAGGCATACTGCCTTGTTTAATGTT
+AATTATGCAGTGTTTCCCTCTGTGTTAGAGCAGAGAGGTTTCGATATTTATTGATGTTTT
+CACAAAGAACAGGAAAATAAAATATTTAAAAATATAAAATGTTTGTTTTATTTTGGGGGA
+AACAAGGACTATATTTGCTGAAAAATCTGATGATTTACATCAATATTTATTTCTCAATTT
+TTTTCTGGGTTTTCAATCTGCTATACAGATAAACTATGAATTATGCCTAATTTCATGTGG
+TGATTGCTGTCACTCCCCTTGGCTCTCACCTAGTAAAGAATGTGCCTTACCAAACTATGG
+TCTTGCCCCTGATGGGAGAATCACTGATACATATTGCCATTTTTACAAGAAGTTCCTTAC
+TACCTTGCTACTCAAATTTACCTCCTTAAAAATATGGAGGGGGGAAATATGGCAGAGACG
+TTTTAACCAGAGCAACTCCATCTTGAATAGGGGCTAGGCAAAATGGGGCTGAGGTTTACT
+GGGCTGGGCTGCATTCCCAGTAGGTTAGGCATTCGAAGTCACAGGATGAGATAGGAGATT
+GGCACAAGATACAGGTCATAAAGACCTTGCTGATAAAACAGGTTACAGTAAAGAAGCCAG
+CTAAAACCCACCAAAGCCAAGATGGAGACGAGAGTGACCTCTGTCGTTCTCACTCGTCAT
+TATACACTAATTATAATATATTAGCATGCTAAAAGACAC
\ No newline at end of file
Binary file test-data/chr1.idx has changed
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/test.fastq	Fri Dec 16 07:37:24 2016 -0500
@@ -0,0 +1,20 @@
+@10.516 HWI-EAS100R:1:1:550:1622/1
+CATGTACTGTTAAAGCGTGCGTTTATTTCAAACATTAATGAAATTTGCAGAACCCAAACTAAAGAGAGAG
++
+3MIa!,$)8EA)!1>tMJ{:2WrL`s|`gg{]'0+Op!6RxNw;V)XKV#Go5}b!`_V]A?!F>{LM(z
+@10.2869 HWI-EAS100R:1:1:1698:585/1
+AACCATGCATAAAAGGGGTTCGCCGTTCTCGGAGAGCCACAGAGCCCGGGCCACAGGCAGCTCCTTGCCA
++
+Q-a;@)*!F]Za^4!P*B?&!!No!^76b+X[6eOgr1$3:-Ywg;!Vzj!`=+e>YV|ok_z!D<2+jx
+@10.2085 HWI-EAS100R:1:1:32:109/2
+GGGAATTCACCTCAAGAACATCCAAAGTGTGAAGGTGAAGTCCCCCGGACCCCACTGCGCCCAAACCGAA
++
+V:e@~!I\GQ>>]?)-qpe!nVI4IJ+4!wE{YoSsVrr~P;PnY/.!a;~!S"n+J#St-g!lQdGA9;
+@10.2869 HWI-EAS100R:1:1:1698:585/2
+CGACTGGAGCTGTTGGTCAGAAATACTGGCGTCTGCCCCCTAATGGCAAATCCAACTGACCAGAAGGAAG
++
+btOb!D1"=hSm"'G_#I{b!!l#6JQ&iq4A`F%Uug!x!'h7o<%qCKQEtM)!bP>!."DvsX9T}=
+@10.516 HWI-EAS100R:1:1:550:1623/1
+CATGTACTGTTAAAGCGTGCGTTTATTTCAAACATTAATGAAATTTGCAGAACCCAAACTAAAGAGAGAG
++
+3MIa!,$)8EA)!1>tMJ{:2WrL`s|`gg{]'0+Op!6RxNw;V)XKV#Go5}b!`_V]A?!F>{LM(z
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/testmap.sam	Fri Dec 16 07:37:24 2016 -0500
@@ -0,0 +1,9 @@
+@HD	VN:1.0
+@SQ	SN:TestChromosomeForGalaxy	LN:3459
+@PG	ID:segemehl	VN:0.2.0-$Rev: 418 $ ($Date: 2015-01-05 05:17:35 -0500 (Mon, 05 Jan 2015) $)	CL:segemehl.x -i chr1.idx -d chr1.fa -q test.fastq -S -m 12 -A 85 -H 1 --minsplicecover 80 --minfragscore 18 --minfraglen 20 --splicescorescale 1.0
+10.516 HWI-EAS100R:1:1:550:1622/1	0	TestChromosomeForGalaxy	182	255	70M	*	0	0	CATGTACTGTTAAAGCGTGCGTTTATTTCAAACATTAATGAAATTTGCAGAACCCAAACTAAAGAGAGAG	3MIa!,$)8EA)!1>tMJ{:2WrL`s|`gg{]'0+Op!6RxNw;V)XKV#Go5}b!`_V]A?!F>{LM(z	NM:i:0	MD:Z:70	NH:i:1	XI:i:0	XA:Z:Q
+10.2869 HWI-EAS100R:1:1:1698:585/1	0	TestChromosomeForGalaxy	661	255	70M	*	0	0	AACCATGCATAAAAGGGGTTCGCCGTTCTCGGAGAGCCACAGAGCCCGGGCCACAGGCAGCTCCTTGCCA	Q-a;@)*!F]Za^4!P*B?&!!No!^76b+X[6eOgr1$3:-Ywg;!Vzj!`=+e>YV|ok_z!D<2+jx	NM:i:0	MD:Z:70	NH:i:1	XI:i:0	XA:Z:Q
+10.2085 HWI-EAS100R:1:1:32:109/2	0	TestChromosomeForGalaxy	1021	255	70M	*	0	0	GGGAATTCACCTCAAGAACATCCAAAGTGTGAAGGTGAAGTCCCCCGGACCCCACTGCGCCCAAACCGAA	V:e@~!I\GQ>>]?)-qpe!nVI4IJ+4!wE{YoSsVrr~P;PnY/.!a;~!S"n+J#St-g!lQdGA9;	NM:i:0	MD:Z:70	NH:i:1	XI:i:0	XA:Z:Q
+10.2869 HWI-EAS100R:1:1:1698:585/2	0	TestChromosomeForGalaxy	1321	255	43M	*	0	0	CGACTGGAGCTGTTGGTCAGAAATACTGGCGTCTGCCCCCTAA	btOb!D1"=hSm"'G_#I{b!!l#6JQ&iq4A`F%Uug!x!'h	NM:i:0	MD:Z:43	NH:i:1	XI:i:0	XL:i:2	XA:Z:Q	XX:i:1	XY:i:43	XQ:i:0	XC:Z:TestChromosomeForGalaxy	XV:i:2123	XT:i:32
+10.2869 HWI-EAS100R:1:1:1698:585/2	0	TestChromosomeForGalaxy	2123	255	27M	*	0	0	TGGCAAATCCAACTGACCAGAAGGAAG	7o<%qCKQEtM)!bP>!."DvsX9T}=	NM:i:0	MD:Z:27	NH:i:1	XI:i:0	XL:i:2	XA:Z:Q	XX:i:44	XY:i:70	XQ:i:1	XP:Z:TestChromosomeForGalaxy	XU:i:1363	XS:i:64
+10.516 HWI-EAS100R:1:1:550:1623/1	0	TestChromosomeForGalaxy	182	255	70M	*	0	0	CATGTACTGTTAAAGCGTGCGTTTATTTCAAACATTAATGAAATTTGCAGAACCCAAACTAAAGAGAGAG	3MIa!,$)8EA)!1>tMJ{:2WrL`s|`gg{]'0+Op!6RxNw;V)XKV#Go5}b!`_V]A?!F>{LM(z	NM:i:0	MD:Z:70	NH:i:1	XI:i:0	XA:Z:Q
--- a/tool_dependencies.xml	Thu Feb 05 08:25:13 2015 -0500
+++ b/tool_dependencies.xml	Fri Dec 16 07:37:24 2016 -0500
@@ -1,6 +1,6 @@
 <?xml version="1.0"?>
 <tool_dependency>
-    <package name="segemehl" version="0.1.6">
-        <repository changeset_revision="7078b80ffc12" name="package_segemehl_0_1_6" owner="rnateam" toolshed="https://toolshed.g2.bx.psu.edu" />
+    <package name="segemehl" version="0.2.0">
+        <repository changeset_revision="11cce9ae6cc6" name="package_segemehl_0_2_0" owner="iuc" toolshed="https://toolshed.g2.bx.psu.edu" />
     </package>
 </tool_dependency>