1
|
1 <tool id="stringtie" name="StringTie" version="1.0.1">
|
0
|
2 <description>RNA-Seq assembler</description>
|
|
3 <requirements>
|
1
|
4 <requirement type="package" version="1.0.1">stringtie</requirement>
|
0
|
5 </requirements>
|
1
|
6 <command><![CDATA[
|
0
|
7 stringtie "$input_bam"
|
|
8 -o "$output_gtf"
|
|
9 -p "\${GALAXY_SLOTS:-1}"
|
|
10 #if str($guide.use_guide) == 'yes':
|
1
|
11 -C "$coverage" -G "$guide.guide_gff" $guide.input_estimation
|
|
12 #if str($guide.output_ballgown) == '-b':
|
|
13 $guide.output_ballgown `pwd`
|
|
14 #end if
|
0
|
15 #end if
|
|
16 #if str($option_set.options) == 'advanced':
|
1
|
17 -l "$option_set.name_prefix"
|
0
|
18 -f "$option_set.fraction"
|
|
19 -m "$option_set.min_tlen"
|
|
20 -a "$option_set.min_anchor_len"
|
|
21 -j "$option_set.min_anchor_cov"
|
|
22 -c "$option_set.min_bundle_cov"
|
|
23 -s "$option_set.maxcov"
|
|
24 -g "$option_set.bdist"
|
|
25 -M "$option_set.bundle_fraction" $option_set.sensitive $option_set.disable_trimming
|
|
26 #end if
|
|
27 ]]>
|
|
28 </command>
|
|
29 <inputs>
|
1
|
30 <param format="bam" label="BAM file to assemble" name="input_bam" type="data" />
|
0
|
31 <conditional name="guide">
|
1
|
32 <param label="Use GFF file to guide assembly" name="use_guide" type="select">
|
0
|
33 <option value="yes">Use GFF</option>
|
1
|
34 <option selected="True" value="no">Do not use GFF</option>
|
0
|
35 </param>
|
|
36 <when value="no" />
|
|
37 <when value="yes">
|
1
|
38 <param format="gtf,gff3" help="(-G)" label="Reference annotation to use for guiding the assembly process" name="guide_gff" type="data" />
|
|
39 <param falsevalue="" help="(-e)" label="Perform abundance estimation only of input transcripts" name="input_estimation" truevalue="-e" type="boolean" />
|
|
40 <param falsevalue="" help="(-b)" label="Output additional files for use in Ballgown" name="output_ballgown" truevalue="-b" type="boolean" />
|
0
|
41 </when>
|
|
42 </conditional>
|
|
43 <conditional name="option_set">
|
1
|
44 <param label="Options" name="options" type="select">
|
|
45 <option selected="True" value="default">Use defaults</option>
|
0
|
46 <option value="advanced">Specify advanced options</option>
|
|
47 </param>
|
|
48 <when value="default" />
|
|
49 <when value="advanced">
|
1
|
50 <param falsevalue="" help="(-t)" label="Disable trimming of predicted transcripts based on coverage" name="disable_trimming" truevalue="-t" type="boolean" />
|
|
51 <param falsevalue="" help="(-S)" label="Increase sensitivity" name="sensitive" truevalue="-S" type="boolean" />
|
|
52 <param help="(-l)" label="Name prefix for output transcripts" name="name_prefix" type="text" value="STRG" />
|
|
53 <param help="(-f)" label="Minimum isoform fraction" max="1.0" min="0.0" name="fraction" type="float" value="0.15" />
|
|
54 <param help="(-m)" label="Minimum assembled transcript length" name="min_tlen" type="integer" value="200" />
|
|
55 <param help="(-a)" label="Minimum anchor length for junctions" name="min_anchor_len" type="integer" value="10" />
|
|
56 <param help="(-j)" label="Minimum junction coverage" name="min_anchor_cov" type="integer" value="1" />
|
|
57 <param help="(-c)" label="Minimum bundle reads per bp coverage to consider for assembly" name="min_bundle_cov" type="integer" value="2" />
|
|
58 <param help="(-s)" label="Coverage saturation threshold" name="maxcov" type="integer" value="1000000" />
|
|
59 <param help="(-g)" label="Gap between read mappings triggering a new bundle" name="bdist" type="integer" value="50" />
|
|
60 <param help="(-M)" label="Fraction of bundle allowed to be covered by multi-hit reads" name="bundle_fraction" type="float" value="0.95" />
|
|
61 </when>
|
0
|
62 </conditional>
|
|
63 </inputs>
|
|
64 <outputs>
|
1
|
65 <data format="gtf" label="${tool.name} on ${on_string}: Assembled transcripts" name="output_gtf" />
|
|
66 <data format="gff3" label="${tool.name} on ${on_string}: Coverage" name="coverage">
|
0
|
67 <filter>guide['use_guide'] == "yes"</filter>
|
|
68 </data>
|
1
|
69 <data format="tabular" from_work_dir="e_data.ctab" label="${tool.name} on ${on_string}: exon-level expression measurements" name="exon_expression">
|
|
70 <filter>guide['output_ballgown']</filter>
|
|
71 </data>
|
|
72 <data format="tabular" from_work_dir="i_data.ctab" label="${tool.name} on ${on_string}: intron-level expression measurements" name="intron_expression">
|
|
73 <filter>guide['output_ballgown']</filter>
|
|
74 </data>
|
|
75 <data format="tabular" from_work_dir="t_data.ctab" label="${tool.name} on ${on_string}: transcript-level expression measurements" name="transcript_expression">
|
|
76 <filter>guide['output_ballgown']</filter>
|
|
77 </data>
|
|
78 <data format="tabular" from_work_dir="e2t.ctab" label="${tool.name} on ${on_string}: exon to transcript mapping" name="exon_transcript_mapping">
|
|
79 <filter>guide['output_ballgown']</filter>
|
|
80 </data>
|
|
81 <data format="tabular" from_work_dir="i2t.ctab" label="${tool.name} on ${on_string}: intron to transcript mapping" name="intron_transcript_mapping">
|
|
82 <filter>guide['output_ballgown']</filter>
|
|
83 </data>
|
0
|
84 </outputs>
|
|
85 <tests>
|
|
86 <test>
|
1
|
87 <param ftype="bam" name="input_bam" value="stringtie_in1.bam" />
|
0
|
88 <param name="use_guide" value="no" />
|
|
89 <param name="options" value="default" />
|
1
|
90 <output file="stringtie_out1.gtf" ftype="gtf" name="output_gtf" />
|
0
|
91 </test>
|
|
92 <test>
|
1
|
93 <param ftype="bam" name="input_bam" value="stringtie_in1.bam" />
|
0
|
94 <param name="use_guide" value="no" />
|
|
95 <param name="options" value="advanced" />
|
|
96 <param name="fraction" value="0.17" />
|
1
|
97 <output file="stringtie_out2.gtf" ftype="gtf" name="output_gtf" />
|
|
98 </test>
|
|
99 <test>
|
|
100 <param ftype="bam" name="input_bam" value="stringtie_in1.bam" />
|
|
101 <param name="use_guide" value="yes" />
|
|
102 <param name="guide_gff" value="stringtie_in.gtf" />
|
|
103 <param name="options" value="default" />
|
|
104 <output file="stringtie_out3.gtf" ftype="gtf" name="output_gtf" />
|
|
105 </test>
|
|
106 <test>
|
|
107 <param ftype="bam" name="input_bam" value="stringtie_in1.bam" />
|
|
108 <param name="use_guide" value="yes" />
|
|
109 <param name="guide_gff" value="stringtie_in.gtf" />
|
|
110 <param name="options" value="advanced" />
|
|
111 <param name="fraction" value="0.17" />
|
|
112 <output file="stringtie_out4.gtf" ftype="gtf" name="output_gtf" />
|
|
113 </test>
|
|
114 <test>
|
|
115 <param ftype="bam" name="input_bam" value="stringtie_in1.bam" />
|
|
116 <param name="use_guide" value="yes" />
|
|
117 <param name="output_ballgown" value="yes" />
|
|
118 <param name="guide_gff" value="stringtie_in.gtf" />
|
|
119 <param name="options" value="default" />
|
|
120 <output file="ballgown/e_data.ctab" ftype="tabular" name="exon_expression" />
|
|
121 <output file="ballgown/i_data.ctab" ftype="tabular" name="intron_expression" />
|
|
122 <output file="ballgown/t_data.ctab" ftype="tabular" name="transcript_expression" />
|
|
123 <output file="ballgown/e2t.ctab" ftype="tabular" name="exon_transcript_mapping" />
|
|
124 <output file="ballgown/i2t.ctab" ftype="tabular" name="intron_transcript_mapping" />
|
|
125 <output file="stringtie_out5.gtf" ftype="gtf" name="output_gtf" />
|
|
126 <output file="stringtie_out_coverage.gtf" ftype="gff3" name="coverage" />
|
0
|
127 </test>
|
|
128 </tests>
|
|
129 <help>
|
|
130 <![CDATA[
|
1
|
131 StringTie v1.0.1 usage:
|
|
132 stringtie <input.bam> [-G <guide_gff>] [-l <label>] [-o <out_gtf>] [-p <cpus>]
|
|
133 [-v] [-a <min_anchor_len>] [-m <min_tlen>] [-j <min_anchor_cov>] [-n sens]
|
|
134 [-C <coverage_file_name>] [-s <maxcov>] [-c <min_bundle_cov>] [-g <bdist>]
|
|
135 {-B | -b <dir_path>} [-e]
|
0
|
136
|
1
|
137 Assemble RNA-Seq alignments into potential transcripts.
|
|
138
|
|
139 Options:
|
|
140 -G reference annotation to use for guiding the assembly process (GTF/GFF3)
|
|
141 -l name prefix for output transcripts (default: STRG)
|
|
142 -f minimum isoform fraction (default: 0.1)
|
|
143 -m minimum assembled transcript length to report (default 200bp)
|
|
144 -o output path/file name for the assembled transcripts GTF (default: stdout)
|
|
145 -a minimum anchor length for junctions (default: 10)
|
|
146 -j minimum junction coverage (default: 1)
|
|
147 -t disable trimming of predicted transcripts based on coverage
|
|
148 (default: coverage trimming is enabled)
|
|
149 -c minimum reads per bp coverage to consider for transcript assembly (default: 2.5)
|
|
150 -s coverage saturation threshold; further read alignments will be
|
|
151 ignored in a region where a local coverage depth of <maxcov>
|
|
152 is reached (default: 1,000,000);
|
|
153 -v verbose (log bundle processing details)
|
|
154 -g gap between read mappings triggering a new bundle (default: 50)
|
|
155 -C output file with reference transcripts that are covered by reads
|
|
156 -M fraction of bundle allowed to be covered by multi-hit reads (default:0.95)
|
|
157 -p number of threads (CPUs) to use (default: 1)
|
|
158 -B enable output of Ballgown table files which will be created in the
|
|
159 same directory as the output GTF (requires -G, -o recommended)
|
|
160 -b enable output of Ballgown table files but these files will be
|
|
161 created under the directory path given as <dir_path>
|
|
162 -e only estimates the abundance of given reference transcripts (requires -G)
|
|
163 ]]>
|
|
164 </help>
|
|
165 <citations>
|
|
166 <citation type="doi">doi:10.1038/nbt.3122</citation>
|
|
167 </citations>
|
|
168 </tool>
|