changeset 5:f504b3b7e49d draft

planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/stringtie commit 65c9ce2fdc2b4ce892df8e456f18b859a85c410a
author iuc
date Wed, 21 Oct 2015 16:07:42 -0400
parents df42808cc33a
children d0bb240d7525
files stringtie.xml test-data/e2t.ctab test-data/e_data.ctab test-data/i2t.ctab test-data/i_data.ctab test-data/stringtie_out1.gtf test-data/stringtie_out2.gtf test-data/stringtie_out3.gtf test-data/stringtie_out4.gtf test-data/stringtie_out5.gtf test-data/stringtie_out6.gtf test-data/stringtie_out7.gtf test-data/t_data.ctab tool_dependencies.xml
diffstat 14 files changed, 81 insertions(+), 17 deletions(-) [+]
line wrap: on
line diff
--- a/stringtie.xml	Wed Aug 12 07:07:40 2015 -0400
+++ b/stringtie.xml	Wed Oct 21 16:07:42 2015 -0400
@@ -1,7 +1,7 @@
-<tool id="stringtie" name="StringTie" version="1.0.4">
+<tool id="stringtie" name="StringTie" version="1.1.0">
     <description>transcript assembly and quantification</description>
     <requirements>
-        <requirement type="package" version="1.0.4">stringtie</requirement>
+        <requirement type="package" version="1.1.0">stringtie</requirement>
     </requirements>
     <command><![CDATA[
 stringtie "$input_bam"
@@ -20,9 +20,14 @@
     -a "$option_set.min_anchor_len"
     -j "$option_set.min_anchor_cov"
     -c "$option_set.min_bundle_cov"
-    -s "$option_set.maxcov"
     -g "$option_set.bdist"
     -M "$option_set.bundle_fraction" $option_set.sensitive $option_set.disable_trimming
+    #if $option_set.A:
+        -A "$gene_abundance_estimation"
+    #end if
+    #if str($option_set.x).strip() != "":
+        -x "$option_set.x"
+    #end if
 #end if
 ]]>
 </command>
@@ -55,14 +60,18 @@
                 <param help="-a" label="Minimum anchor length for junctions" name="min_anchor_len" type="integer" value="10" />
                 <param help="-j" label="Minimum junction coverage" name="min_anchor_cov" type="integer" value="1" />
                 <param help="-c" label="Minimum bundle reads per bp coverage to consider for assembly" name="min_bundle_cov" type="integer" value="2" />
-                <param help="-s" label="Coverage saturation threshold" name="maxcov" type="integer" value="1000000" />
                 <param help="-g" label="Gap between read mappings triggering a new bundle" name="bdist" type="integer" value="50" />
                 <param help="-M" label="Fraction of bundle allowed to be covered by multi-hit reads" name="bundle_fraction" type="float" value="0.95" />
+                <param argument="-x" type="text" value="" label="Do not assemble any transcripts on these reference sequence(s)" help="e.g. chrM,chrX" />
+                <param argument="-A" truevalue="-A" falsevalue="" type="boolean" help="" label="Additional gene abundance estimation output file" />
             </when>
         </conditional>
     </inputs>
     <outputs>
         <data format="gtf" label="${tool.name} on ${on_string}: Assembled transcripts" name="output_gtf" />
+        <data format="tabular" label="${tool.name} on ${on_string}: Gene abundance estimates" name="gene_abundance_estimation">
+            <filter>option_set['options'] == 'advanced' and option_set['A']</filter> <!-- 'A' exists only in the advanced case; the guard avoids a failing lookup in default mode that would leave this output unfiltered -->
+        </data>
         <data format="gff3" label="${tool.name} on ${on_string}: Coverage" name="coverage">
             <filter>guide['use_guide'] == "yes"</filter>
         </data>
@@ -125,6 +134,25 @@
             <output file="stringtie_out5.gtf" ftype="gtf" name="output_gtf" lines_diff="2" />
             <output file="stringtie_out_coverage.gtf" ftype="gff3" name="coverage" />
         </test>
+        <test> <!-- guided run with advanced options and -A enabled; also checks the gene abundance output -->
+            <param ftype="bam" name="input_bam" value="stringtie_in1.bam" />
+            <param name="use_guide" value="yes" />
+            <param name="guide_gff" value="stringtie_in.gtf" />
+            <param name="options" value="advanced" />
+            <param name="fraction" value="0.17" />
+            <param name="A" value="True" />
+            <output file="stringtie_out4.gtf" ftype="gtf" name="output_gtf" lines_diff="2" />
+            <output file="stringtie_out6.gtf" ftype="tabular" name="gene_abundance_estimation" /> <!-- tab-separated gene abundance table despite the .gtf file name -->
+        </test>
+        <test> <!-- guided run with advanced options and isoform fraction 0.15 -->
+            <param ftype="bam" name="input_bam" value="stringtie_in1.bam" />
+            <param name="use_guide" value="yes" />
+            <param name="guide_gff" value="stringtie_in.gtf" />
+            <param name="options" value="advanced" />
+            <param name="fraction" value="0.15" />
+            <param name="c" value="test_chromosome" /> <!-- NOTE(review): no param named "c" is visible in this diff; the new text param is declared with argument="-x", and the recorded command in test-data/stringtie_out7.gtf shows no -x. Presumably meant to exercise -x; confirm, and regenerate the expected output if renamed -->
+            <output file="stringtie_out7.gtf" ftype="gtf" name="output_gtf" lines_diff="2" />
+        </test>
     </tests>
     <help>
 <![CDATA[
@@ -142,16 +170,13 @@
  -G reference annotation to use for guiding the assembly process (GTF/GFF3)
  -l name prefix for output transcripts (default: STRG)
  -f minimum isoform fraction (default: 0.1)
- -m minimum assembled transcript length to report (default 200bp)
+ -m minimum assembled transcript length (default: 200)
  -o output path/file name for the assembled transcripts GTF (default: stdout)
  -a minimum anchor length for junctions (default: 10)
  -j minimum junction coverage (default: 1)
  -t disable trimming of predicted transcripts based on coverage
     (default: coverage trimming is enabled)
  -c minimum reads per bp coverage to consider for transcript assembly (default: 2.5)
- -s coverage saturation threshold; further read alignments will be
-    ignored in a region where a local coverage depth of <maxcov> 
-    is reached (default: 1,000,000);
  -v verbose (log bundle processing details)
  -g gap between read mappings triggering a new bundle (default: 50)
  -C output file with reference transcripts that are covered by reads
@@ -162,6 +187,10 @@
  -b enable output of Ballgown table files but these files will be 
     created under the directory path given as <dir_path>
  -e only estimates the abundance of given reference transcripts (requires -G)
+ -A gene abundance estimation output file
+ -x do not assemble any transcripts on these reference sequence(s)
+
+
  ]]>
     </help>
     <citations>
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/e2t.ctab	Wed Oct 21 16:07:42 2015 -0400
@@ -0,0 +1,4 @@
+e_id	t_id
+1	1
+2	1
+3	1
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/e_data.ctab	Wed Oct 21 16:07:42 2015 -0400
@@ -0,0 +1,4 @@
+e_id	chr	strand	start	end	rcount	ucount	mrcount	cov	cov_sd	mcov	mcov_sd
+1	test_chromosome	+	53	250	158	158	158.00	49.7778	22.0747	49.7778	22.0747
+2	test_chromosome	+	351	400	73	73	73.00	54.1600	6.1753	54.1600	6.1753
+3	test_chromosome	+	501	550	38	38	38.00	21.6400	12.4350	21.6400	12.4350
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/i2t.ctab	Wed Oct 21 16:07:42 2015 -0400
@@ -0,0 +1,3 @@
+i_id	t_id
+1	1
+2	1
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/i_data.ctab	Wed Oct 21 16:07:42 2015 -0400
@@ -0,0 +1,3 @@
+i_id	chr	strand	start	end	rcount	ucount	mrcount
+1	test_chromosome	+	251	350	49	49	49.00
+2	test_chromosome	+	401	500	38	38	38.00
--- a/test-data/stringtie_out1.gtf	Wed Aug 12 07:07:40 2015 -0400
+++ b/test-data/stringtie_out1.gtf	Wed Oct 21 16:07:42 2015 -0400
@@ -1,4 +1,6 @@
-test_chromosome	StringTie	transcript	53	550	1000	+	.	gene_id "STRG.1"; transcript_id "STRG.1.1"; cov "44.724823"; FPKM "3276543.750000";
-test_chromosome	StringTie	exon	53	250	1000	+	.	gene_id "STRG.1"; transcript_id "STRG.1.1"; exon_number "1"; cov "49.011967";
+# stringtie /tmp/tmpoOYb63/files/000/dataset_1.dat -o /tmp/tmpoOYb63/files/000/dataset_2.dat -p 1
+# StringTie version 1.1.0
+test_chromosome	StringTie	transcript	53	550	1000	+	.	gene_id "STRG.1"; transcript_id "STRG.1.1"; cov "44.682419"; FPKM "3273437.500000"; TPM "995243.375000";
+test_chromosome	StringTie	exon	53	250	1000	+	.	gene_id "STRG.1"; transcript_id "STRG.1.1"; exon_number "1"; cov "48.948147";
 test_chromosome	StringTie	exon	351	400	1000	+	.	gene_id "STRG.1"; transcript_id "STRG.1.1"; exon_number "2"; cov "51.382565";
 test_chromosome	StringTie	exon	501	550	1000	+	.	gene_id "STRG.1"; transcript_id "STRG.1.1"; exon_number "3"; cov "21.090000";
--- a/test-data/stringtie_out2.gtf	Wed Aug 12 07:07:40 2015 -0400
+++ b/test-data/stringtie_out2.gtf	Wed Oct 21 16:07:42 2015 -0400
@@ -1,4 +1,6 @@
-test_chromosome	StringTie	transcript	53	550	1000	+	.	gene_id "STRG.1"; transcript_id "STRG.1.1"; cov "44.724823"; FPKM "3276543.750000";
-test_chromosome	StringTie	exon	53	250	1000	+	.	gene_id "STRG.1"; transcript_id "STRG.1.1"; exon_number "1"; cov "49.011967";
+# stringtie /tmp/tmpoOYb63/files/000/dataset_9.dat -o /tmp/tmpoOYb63/files/000/dataset_10.dat -p 1 -l STRG -f 0.17 -m 200 -a 10 -j 1 -c 2 -g 50 -M 0.95
+# StringTie version 1.1.0
+test_chromosome	StringTie	transcript	53	550	1000	+	.	gene_id "STRG.1"; transcript_id "STRG.1.1"; cov "44.682419"; FPKM "3273437.500000"; TPM "995243.375000";
+test_chromosome	StringTie	exon	53	250	1000	+	.	gene_id "STRG.1"; transcript_id "STRG.1.1"; exon_number "1"; cov "48.948147";
 test_chromosome	StringTie	exon	351	400	1000	+	.	gene_id "STRG.1"; transcript_id "STRG.1.1"; exon_number "2"; cov "51.382565";
 test_chromosome	StringTie	exon	501	550	1000	+	.	gene_id "STRG.1"; transcript_id "STRG.1.1"; exon_number "3"; cov "21.090000";
--- a/test-data/stringtie_out3.gtf	Wed Aug 12 07:07:40 2015 -0400
+++ b/test-data/stringtie_out3.gtf	Wed Oct 21 16:07:42 2015 -0400
@@ -1,4 +1,6 @@
-test_chromosome	StringTie	transcript	53	550	1000	+	.	gene_id "STRG.1"; transcript_id "STRG.1.1"; reference_id "CUFF.1.1"; ref_gene_id "CUFF.1"; cov "44.724823"; FPKM "3276543.750000";
+# stringtie /tmp/tmpoOYb63/files/000/dataset_16.dat -o /tmp/tmpoOYb63/files/000/dataset_18.dat -p 1 -C /tmp/tmpoOYb63/files/000/dataset_20.dat -G /tmp/tmpoOYb63/files/000/dataset_17.dat
+# StringTie version 1.1.0
+test_chromosome	StringTie	transcript	53	550	1000	+	.	gene_id "STRG.1"; transcript_id "STRG.1.1"; reference_id "CUFF.1.1"; ref_gene_id "CUFF.1"; cov "44.724823"; FPKM "3276543.750000"; TPM "996187.875000";
 test_chromosome	StringTie	exon	53	250	1000	+	.	gene_id "STRG.1"; transcript_id "STRG.1.1"; exon_number "1"; reference_id "CUFF.1.1"; ref_gene_id "CUFF.1"; cov "49.011967";
 test_chromosome	StringTie	exon	351	400	1000	+	.	gene_id "STRG.1"; transcript_id "STRG.1.1"; exon_number "2"; reference_id "CUFF.1.1"; ref_gene_id "CUFF.1"; cov "51.382565";
 test_chromosome	StringTie	exon	501	550	1000	+	.	gene_id "STRG.1"; transcript_id "STRG.1.1"; exon_number "3"; reference_id "CUFF.1.1"; ref_gene_id "CUFF.1"; cov "21.090000";
--- a/test-data/stringtie_out4.gtf	Wed Aug 12 07:07:40 2015 -0400
+++ b/test-data/stringtie_out4.gtf	Wed Oct 21 16:07:42 2015 -0400
@@ -1,4 +1,6 @@
-test_chromosome	StringTie	transcript	53	550	1000	+	.	gene_id "STRG.1"; transcript_id "STRG.1.1"; reference_id "CUFF.1.1"; ref_gene_id "CUFF.1"; cov "44.724823"; FPKM "3276543.750000";
+# stringtie /tmp/tmpoOYb63/files/000/dataset_35.dat -o /tmp/tmpoOYb63/files/000/dataset_37.dat -p 1 -C /tmp/tmpoOYb63/files/000/dataset_39.dat -G /tmp/tmpoOYb63/files/000/dataset_36.dat -l STRG -f 0.17 -m 200 -a 10 -j 1 -c 2 -g 50 -M 0.95 -A /tmp/tmpoOYb63/files/000/dataset_38.dat
+# StringTie version 1.1.0
+test_chromosome	StringTie	transcript	53	550	1000	+	.	gene_id "STRG.1"; transcript_id "STRG.1.1"; reference_id "CUFF.1.1"; ref_gene_id "CUFF.1"; cov "44.724823"; FPKM "3276543.750000"; TPM "996187.875000";
 test_chromosome	StringTie	exon	53	250	1000	+	.	gene_id "STRG.1"; transcript_id "STRG.1.1"; exon_number "1"; reference_id "CUFF.1.1"; ref_gene_id "CUFF.1"; cov "49.011967";
 test_chromosome	StringTie	exon	351	400	1000	+	.	gene_id "STRG.1"; transcript_id "STRG.1.1"; exon_number "2"; reference_id "CUFF.1.1"; ref_gene_id "CUFF.1"; cov "51.382565";
 test_chromosome	StringTie	exon	501	550	1000	+	.	gene_id "STRG.1"; transcript_id "STRG.1.1"; exon_number "3"; reference_id "CUFF.1.1"; ref_gene_id "CUFF.1"; cov "21.090000";
--- a/test-data/stringtie_out5.gtf	Wed Aug 12 07:07:40 2015 -0400
+++ b/test-data/stringtie_out5.gtf	Wed Oct 21 16:07:42 2015 -0400
@@ -1,4 +1,6 @@
-test_chromosome	StringTie	transcript	53	550	1000	+	.	gene_id "STRG.1"; transcript_id "STRG.1.1"; reference_id "CUFF.1.1"; ref_gene_id "CUFF.1"; cov "44.724823"; FPKM "3276543.750000";
+# stringtie /tmp/tmpoOYb63/files/000/dataset_25.dat -o /tmp/tmpoOYb63/files/000/dataset_27.dat -p 1 -C /tmp/tmpoOYb63/files/000/dataset_29.dat -G /tmp/tmpoOYb63/files/000/dataset_26.dat -b /tmp/tmpoOYb63/job_working_directory/000/13
+# StringTie version 1.1.0
+test_chromosome	StringTie	transcript	53	550	1000	+	.	gene_id "STRG.1"; transcript_id "STRG.1.1"; reference_id "CUFF.1.1"; ref_gene_id "CUFF.1"; cov "44.724823"; FPKM "3276543.750000"; TPM "996187.875000";
 test_chromosome	StringTie	exon	53	250	1000	+	.	gene_id "STRG.1"; transcript_id "STRG.1.1"; exon_number "1"; reference_id "CUFF.1.1"; ref_gene_id "CUFF.1"; cov "49.011967";
 test_chromosome	StringTie	exon	351	400	1000	+	.	gene_id "STRG.1"; transcript_id "STRG.1.1"; exon_number "2"; reference_id "CUFF.1.1"; ref_gene_id "CUFF.1"; cov "51.382565";
 test_chromosome	StringTie	exon	501	550	1000	+	.	gene_id "STRG.1"; transcript_id "STRG.1.1"; exon_number "3"; reference_id "CUFF.1.1"; ref_gene_id "CUFF.1"; cov "21.090000";
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/stringtie_out6.gtf	Wed Oct 21 16:07:42 2015 -0400
@@ -0,0 +1,3 @@
+Gene ID	Gene Name	Strand	Start	End	Length	Coverage	FPKM	TPM
+CUFF.1	-	+	53	550	298	44.895973	3289082.250000	1000000.000000
+STRG.1	-	+	53	550	298	44.895973	3289082.250000	1000000.000000
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/stringtie_out7.gtf	Wed Oct 21 16:07:42 2015 -0400
@@ -0,0 +1,6 @@
+# stringtie /tmp/tmpoOYb63/files/000/dataset_40.dat -o /tmp/tmpoOYb63/files/000/dataset_42.dat -p 1 -C /tmp/tmpoOYb63/files/000/dataset_43.dat -G /tmp/tmpoOYb63/files/000/dataset_41.dat -l STRG -f 0.15 -m 200 -a 10 -j 1 -c 2 -g 50 -M 0.95
+# StringTie version 1.1.0
+test_chromosome	StringTie	transcript	53	550	1000	+	.	gene_id "STRG.1"; transcript_id "STRG.1.1"; reference_id "CUFF.1.1"; ref_gene_id "CUFF.1"; cov "44.724823"; FPKM "3276543.750000"; TPM "996187.875000";
+test_chromosome	StringTie	exon	53	250	1000	+	.	gene_id "STRG.1"; transcript_id "STRG.1.1"; exon_number "1"; reference_id "CUFF.1.1"; ref_gene_id "CUFF.1"; cov "49.011967";
+test_chromosome	StringTie	exon	351	400	1000	+	.	gene_id "STRG.1"; transcript_id "STRG.1.1"; exon_number "2"; reference_id "CUFF.1.1"; ref_gene_id "CUFF.1"; cov "51.382565";
+test_chromosome	StringTie	exon	501	550	1000	+	.	gene_id "STRG.1"; transcript_id "STRG.1.1"; exon_number "3"; reference_id "CUFF.1.1"; ref_gene_id "CUFF.1"; cov "21.090000";
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/t_data.ctab	Wed Oct 21 16:07:42 2015 -0400
@@ -0,0 +1,2 @@
+t_id	chr	strand	start	end	t_name	num_exons	length	gene_id	gene_name	cov	FPKM
+1	test_chromosome	+	53	550	CUFF.1.1	3	298	CUFF.1	.	44.724823	3276543.750000
--- a/tool_dependencies.xml	Wed Aug 12 07:07:40 2015 -0400
+++ b/tool_dependencies.xml	Wed Oct 21 16:07:42 2015 -0400
@@ -1,6 +1,6 @@
 <?xml version="1.0"?>
 <tool_dependency>
-  <package name="stringtie" version="1.0.4">
-      <repository changeset_revision="f3818f4bc127" name="package_stringtie_1_0_4" owner="iuc" toolshed="https://toolshed.g2.bx.psu.edu" />
+  <package name="stringtie" version="1.1.0">
+      <repository changeset_revision="62a98ebf406f" name="package_stringtie_1_1_0" owner="iuc" toolshed="https://toolshed.g2.bx.psu.edu" />
     </package>
 </tool_dependency>