annotate sortmerna_wrapper.xml @ 0:2e7f0da431e3 draft default tip

Uploaded version 1.0
author bonsai
date Tue, 30 Apr 2013 13:12:35 -0400
parents
children
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
0
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
1 <?xml version="1.0" encoding="utf-8"?>
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
2 <tool id="sortmerna_wrapper" version="1.0" name="Filter with SortMeRNA">
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
3 <requirements>
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
4 <requirement type='package' version="1.7">sortmerna</requirement>
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
5 </requirements>
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
6 <description>Fast and accurate filtering of ribosomal RNAs in metatranscriptomic data</description>
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
7 <command interpreter="python">
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
8 sortmerna_wrapper.py
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
9 --sortmerna "
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
10 $strand_search
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
11 #if str( $read_family.read_family_selector ) == 'other':
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
12 --I $input_reads -r $read_family.ratio_parameter
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
13 #else:
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
14 $read_family.read_family_selector $input_reads
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
15 #end if
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
16 #if str( $sequencing_type.sequencing_type_selector ) == 'paired':
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
17 $sequencing_type.paired_type
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
18 #end if
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
19
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
20 #if $outputs_selected:
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
21 #if 'accept' in $outputs_selected.value:
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
22 --accept accept_file
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
23 #end if
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
24 #if 'other' in $outputs_selected.value:
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
25 --other other_file
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
26 #end if
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
27 #end if
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
28 $log
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
29 #if str( $options.options_type_selector ) == 'more':
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
30 -a $options.number_of_threads
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
31 #end if
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
32 "
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
33 #if str( $databases_type.databases_selector ) == 'history':
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
34 --buildtrie
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
35 #for $db in $databases_type.input_databases
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
36 $db.database_name
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
37 #end for
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
38 #else:
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
39 ## databases path is not directly accessible, must match by hand with LOC file contents
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
40 ${' '.join([dict([(x[0], x[2]) for x in $databases_type.input_databases.input.options.tool_data_table.data])[y]
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
41 for y in $databases_type.input_databases.value])}
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
42 #end if
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
43 </command>
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
44 <inputs>
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
45 <conditional name="read_family">
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
46 <param name="read_family_selector" type="select" format="text"
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
47 help="The Illumina platform is more common for large scale metatranscriptomic projects requiring a high throughput.">
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
48 <label>Sequencing technology of querying sequences (reads)</label>
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
49 <option value="--I">Illumina Solexa</option>
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
50 <option value="--454">454 Roche</option>
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
51 <option value="other">Other</option>
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
52 </param>
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
53 <when value="other">
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
54 <param name="ratio_parameter" type="float" value="1" min="0" max="1"
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
55 label="Ratio parameter (the number of hits on the read / read length)"
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
56 help="The ratio parameter for SortMeRNA has been set to r=0.25 for Illumina Solexa reads and to r=0.15 for 454 Roche reads.
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
57 For other read types, if the sequencing technology produces high quality reads with a low substitution error rate
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
58 (0.1 substitutions per 100 bases, such as Illumina), then the ratio parameter can be set to r=[0.23,0.27].
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
59 If the sequencing technology has a high indel error rate (1-2 indels per 100 bases, such as 454 or Ion Torrent),
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
60 then the ratio parameter can be set to r=[0.13,0.17]."/>
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
61 </when>
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
62 </conditional>
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
63 <param format="fasta,fastq" name="input_reads" type="data" label="Querying sequences (reads)" help=""/>
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
64
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
65 <conditional name="sequencing_type">
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
66 <param name="sequencing_type_selector" type="select" label="Sequencing type">
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
67 <option value="not_paired">Reads are not paired</option>
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
68 <option value="paired">Reads are paired</option>
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
69 </param>
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
70 <when value="paired">
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
71 <param name="paired_type" type="select" label="If one read of a pair is accepted and the other not, output both reads" display="radio"
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
72 help="SortMeRNA does not use the pairing information for filtering RNA,
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
73 however if one read of a pair is accepted and the other is not,
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
74 the resulting output may break apart the pair into two separate files.
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
75 The purpose of 'Reads are paired' option is to preserve the pairing of the reads.">
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
76 <option value="--paired-in">to accepted file</option>
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
77 <option value="--paired-out">to rejected file</option>
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
78 </param>
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
79 </when>
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
80 </conditional>
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
81
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
82 <param name="strand_search" type="select" label="Which strands to search" display="radio">
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
83 <option value="">Search both strands</option>
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
84 <option value="-F">Search only the forward strand</option>
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
85 <option value="-R">Search only the reverse-complementary strand</option>
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
86 </param>
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
87
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
88 <conditional name="databases_type">
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
89 <param name="databases_selector" type="select" label="Databases to query"
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
90 help="Public rRNA databases provided with SortMeRNA have been indexed.
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
91 On the contrary, personal databases must be indexed each time SortMeRNA is launched.
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
92 Please be patient, this may take some time depending on the size of the given database.">
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
93 <option value="cached" selected="true">Public ribosomal databases</option>
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
94 <option value="history">Databases from your history</option>
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
95 </param>
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
96 <when value="cached">
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
97 <param name="input_databases" label="rRNA database"
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
98 type="select" display="checkboxes" multiple="true">
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
99 <options from_data_table="rRNA_databases" />
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
100 <validator type="no_options" message="Select at least one database"/>
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
101 </param>
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
102 </when>
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
103 <when value="history">
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
104 <repeat name="input_databases" title="Database" min="1">
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
105 <param name="database_name" type="data" format="fasta" label="rRNA database"
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
106 help="Your database will be indexed first, which may take up to several minutes."/>
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
107 </repeat>
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
108 </when>
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
109 </conditional>
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
110
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
111 <!-- Outputs -->
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
112 <param name="outputs_selected" type="select" display="checkboxes" multiple="true" label="Output options">
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
113 <option value="accept" selected="True">Reads matching to at least one database</option>
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
114 <option value="other">Reads not found in any database</option>
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
115 </param>
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
116 <param name="log" type="boolean" checked="False" truevalue="--log log_file" falsevalue="" label="Statistics file"
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
117 help="Generates statistics for the rRNA content of reads, as well as rRNA subunit distribution.">
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
118 </param>
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
119
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
120 <!-- Advanced options -->
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
121 <conditional name="options">
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
122 <param name="options_type_selector" type="select" label="Advanced Options">
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
123 <option value="less" selected="True">Less options</option>
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
124 <option value="more">More options</option>
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
125 </param>
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
126 <when value="less">
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
127 <!-- no options -->
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
128 </when>
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
129 <when value="more">
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
130 <param name="number_of_threads" type="integer" label="Number of threads to use" value="1" min="1"/>
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
131 </when>
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
132 </conditional>
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
133 </inputs>
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
134 <outputs>
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
135 <data format="input" format_source="input_reads" name="output_accept" from_work_dir="accept_file.dat"
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
136 label="Matching reads on ${on_string} (${input_reads.datatype.file_ext})">
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
137 <filter>outputs_selected and 'accept' in outputs_selected</filter>
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
138 </data>
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
139 <data format="input" format_source="input_reads" name="output_other" from_work_dir="other_file.dat"
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
140 label="Reads not found on ${on_string} (${input_reads.datatype.file_ext})">
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
141 <filter>outputs_selected and 'other' in outputs_selected</filter>
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
142 </data>
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
143 <data format="txt" name="output_log" label="${tool.name} statistics (txt)" from_work_dir="log_file.log">
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
144 <filter>log</filter>
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
145 </data>
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
146 </outputs>
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
147 <stdio>
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
148 <regex match="This program builds a Burst trie on an input rRNA database"
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
149 source="both"
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
150 level="fatal"
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
151 description="Buildtrie program failed to execute." />
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
152 <regex match="The database name"
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
153 source="both"
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
154 level="fatal"
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
155 description="The database ${databases} has not been preprocessed using buildtrie before using SortMeRNA." />
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
156 </stdio>
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
157 <tests>
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
158 <test>
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
159 <param name="read_family_selector" value="I" />
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
160 <param name="input_reads" value="sortmerna_wrapper_in1.fastq" />
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
161 <param name="sequencing_type_selector" value ="not_paired" />
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
162 <param name="strand_search" value="" />
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
163 <param name="databases_selector" value="cached" />
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
164 <param name="input_databases" value="rfam-5.8s,rfam-5s" />
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
165 <param name="outputs_selected" value="accept,other" />
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
166 <param name="log" value="" />
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
167 <param name="options_type_selector" value="less" />
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
168 <output name="output_accept" file="sortmerna_wrapper_accept1.fastq" />
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
169 <output name="output_other" file="sortmerna_wrapper_other1.fastq" />
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
170 </test>
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
171 </tests>
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
172 <help>
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
173 **Overview**
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
174
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
175 SortMeRNA_ is a software designed to rapidly filter ribosomal RNA fragments
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
176 from metatransriptomic data produced by next-generation sequencers.
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
177 It is capable of handling large RNA databases and sorting out all fragments
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
178 matching to the database with high accuracy and specificity.
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
179
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
180 .. _SortMeRNA: http://bioinfo.lifl.fr/RNA/sortmerna/
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
181
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
182 If you use this tool, please cite Kopylova E., Noé L. and Touzet H.,
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
183 `"SortMeRNA: Fast and accurate filtering of ribosomal RNAs in metatranscriptomic data"`__,
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
184 Bioinformatics (2012), doi: 10.1093/bioinformatics/bts611.
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
185
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
186 .. __: http://bioinformatics.oxfordjournals.org/content/28/24/3211
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
187
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
188 ------
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
189
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
190 **Input**
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
191
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
192 The input is one file of reads in FASTA or FASTQ format and any number of rRNA databases to search against.
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
193 If the user has two foward-reverse paired-sequencing reads files, they may use
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
194 the script "merge_paired_reads.sh" to interleave the reads into one file, preserving their order.
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
195
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
196 If the sequencing type for the reads is paired-ended, the user has two options under
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
197 "Sequencing type" to filter the reads and preserve their order in the file.
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
198 For a further example of each option, please refer to Section 4.2.3 in the `SortMeRNA User Manual`_.
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
199
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
200 .. _sortmerna user manual: http://bioinfo.lifl.fr/RNA/sortmerna/code/SortMeRNA-user-manual-v1.7.pdf
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
201
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
202 ------
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
203
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
204 **Output**
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
205
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
206 The output will follow the same format (FASTA or FASTQ) as the reads.
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
207
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
208 In the standalone version of SortMeRNA, the user may output the matching reads in a separate file per database (--bydbs option). This option will be made available in a future version of Galaxy.
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
209
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
210 ------
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
211
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
212 **rRNA databases**
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
213
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
214 SortMeRNA is distributed with 8 representative rRNA databases, which were
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
215 all constructed from the SILVA SSU,LSU (version 111) and the RFAM 5/5.8S
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
216 (version 11.0) databases using the tool UCLUST.
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
217
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
218 +--------------------------+------+--------------+-------+------------------------+--------+--------------------+
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
219 | Representative database | id % | avergage id% | # seq | Origin | # seq | filtered to remove |
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
220 +==========================+======+==============+=======+========================+========+====================+
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
221 | SILVA 16S bacteria | 85 | 91.6 | 8174 | SILVA SSU Ref NR v.111 | 244077 | 23s |
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
222 +--------------------------+------+--------------+-------+------------------------+--------+--------------------+
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
223 | SILVA 16S archaea | 95 | 96.7 | 3845 | SILVA SSU Ref NR v.111 | 10919 | 23s |
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
224 +--------------------------+------+--------------+-------+------------------------+--------+--------------------+
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
225 | SILVA 18S eukarya | 95 | 96.7 | 4512 | SILVA SSU Ref NR v.111 | 31862 | 26s,28s,23s |
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
226 +--------------------------+------+--------------+-------+------------------------+--------+--------------------+
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
227 | |
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
228 +--------------------------+------+--------------+-------+------------------------+--------+--------------------+
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
229 | SILVA 23S bacteria | 98 | 99.4 | 3055 | SILVA LSU Ref v.111 | 19580 | 16s,26s,28s |
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
230 +--------------------------+------+--------------+-------+------------------------+--------+--------------------+
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
231 | SILVA 23s archaea | 98 | 99.5 | 164 | SILVA LSU Ref v.111 | 405 | 16s,26s,28s |
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
232 +--------------------------+------+--------------+-------+------------------------+--------+--------------------+
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
233 | SILVA 28S eukarya | 98 | 99.1 | 4578 | SILVA LSU Ref v.111 | 9321 | 18s |
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
234 +--------------------------+------+--------------+-------+------------------------+--------+--------------------+
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
235 | |
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
236 +--------------------------+------+--------------+-------+------------------------+--------+--------------------+
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
237 | Rfam 5S archaea/bacteria | 98 | 99.2 | 59513 | RFAM | 116760 | |
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
238 +--------------------------+------+--------------+-------+------------------------+--------+--------------------+
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
239 | Rfam 5.8S eukarya | 98 | 98.9 | 13034 | RFAM | 225185 | |
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
240 +--------------------------+------+--------------+-------+------------------------+--------+--------------------+
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
241
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
242
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
243 id % :
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
244 members of the cluster must have identity at least 'id %' identity with the representative sequence
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
245
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
246 average id % :
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
247 average identity of a cluster member to the representative sequence
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
248
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
249 The user may also choose to use their own rRNA databases.
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
250
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
251 .. class:: warningmark
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
252
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
253 Note that your personal databases are indexed each time, and that
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
254 this may take some time depending on the size of the given database.
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
255
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
256 ------
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
257
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
258 **SortMeRNA parameter list**
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
259
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
260 The standalone, command-line version of SortMeRNA uses the following parameters.
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
261
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
262 For indexing (buildtrie):
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
263
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
264 This program builds a Burst trie on an input rRNA database file in fasta format
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
265 and stores the material in binary files under the folder '/automata'::
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
266
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
267 ./buildtrie --db [path to rrnas database file name {.fasta}] {OPTIONS}
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
268
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
269 The list of OPTIONS can be left blank, the default values will be used::
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
270
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
271 -L length of the sliding window (the seed)
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
272 (default: 18)
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
273
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
274 -F search only the forward strand
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
275 -R search only the reverse-complementary strand
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
276 (default: both strands are searched)
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
277
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
278 -h help
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
279
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
280
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
281
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
282
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
283 For sorting (sortmerna):
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
284
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
285 To run SortMeRNA, type in any order after 'sortmerna'::
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
286
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
287 --I [illumina reads file name {fasta/fastq}]
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
288
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
289 --454 [roche 454 reads file name {fasta/fastq}]
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
290
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
291 -n number of databases to use (must precede --db)
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
292
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
293 --db [rrnas database name(s)]
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
294
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
295 One database,
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
296 ex 1. -n 1 --db /path1/database1.fasta
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
297
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
298 Multiple databases,
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
299 ex 2. -n 2 --db /path2/database2.fasta /path3/database3.fasta
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
300
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
301 {OPTIONS}
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
302
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
303 The list of OPTIONS can be left blank, the default values will be used::
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
304
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
305 --accept [accepted reads file name]
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
306 --other [rejected reads file name]
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
307 (default: no output file is created)
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
308
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
309 --bydbs output the accepted reads by database
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
310 (default: concatenated file of reads)
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
311
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
312 --log [overall statistics file name]
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
313 (default: no statistics file created)
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
314
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
315 --paired-in put both paired-end reads into --accept file
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
316 --paired-out put both paired-end reads into --other file
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
317 (default: if one read is accepted and the other is not,
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
318 separate the reads into --accept and --other files)
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
319
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
320 -r ratio of the number of hits on the read / read length
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
321 (default Illumina: 0.25, Roche 454: 0.15)
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
322
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
323 -F search only the forward strand
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
324 -R search only the reverse-complementary strand
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
325 (default: both strands are searched)
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
326
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
327 -a number of threads to use
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
328 (default: 1)
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
329
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
330 -m (m x 4096 bytes) for loading the reads into memory
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
331 ex. '-m 4' means 4*4096 = 16384 bytes will be allocated for the reads
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
332 note: maximum -m is 1020039
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
333 (default: m = 262144 = 1GB)
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
334
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
335 -v verbose
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
336 (default: deactivated)
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
337
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
338 -h help
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
339
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
340 --version version number
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
341
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
342 ------
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
343
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
344 **Bibliography**
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
345
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
346 [1] Quast C, Pruesse E, Yilmaz P, Gerken J, Schweer T, Yarza P, Peplies J, Glöckner FO (2013) The SILVA ribosomal RNA gene database project: improved data processing and web-based tools, Nucleic Acids Research, 41 (D1): D590-D596.
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
347
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
348 [2] Rfam 11.0: 10 years of RNA families. S.W. Burge, J. Daub, R. Eberhardt, J. Tate, L. Barquist, E.P. Nawrocki, S.R. Eddy, P.P. Gardner, A. Bateman. Nucleic Acids Research (2012), doi: 10.1093/nar/gks1005
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
349
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
350 [3] Edgar, R.C. (2010) Search and clustering orders of magnitude faster than BLAST, Bioinformatics 26(19), 2460-2461, doi: 10.1093/bioinformatics/btq461
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
351
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
352 [4] Loman, N. J. and Misra, Raju V and Dallman, Timothy J and Constantinidou, Chrystala and Gharbia, Saheer E and Wain, John and Pallen, Mark J., Performance comparison of benchtop high-throughput sequencing platforms (2012), Nature Biotechnology, 30 (5). pp. 434-439
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
353 </help>
2e7f0da431e3 Uploaded version 1.0
bonsai
parents:
diff changeset
354 </tool>