annotate tools/next_gen_conversion/solid2fastq.xml @ 0:9071e359b9a3

Uploaded
author xuebing
date Fri, 09 Mar 2012 19:37:19 -0500
parents
children
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
0
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
1 <tool id="solid2fastq" name="Convert">
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
2 <description>SOLiD output to fastq</description>
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
3 <command interpreter="python">
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
4 #if $is_run.paired == "no" #solid2fastq.py --fr=$input1 --fq=$input2 --fout=$out_file1 -q $qual $trim_name $trim_first_base $double_encode
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
5 #elif $is_run.paired == "yes" #solid2fastq.py --fr=$input1 --fq=$input2 --fout=$out_file1 --rr=$input3 --rq=$input4 --rout=$out_file2 -q $qual $trim_name $trim_first_base $double_encode
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
6 #end if#
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
7 </command>
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
8 <inputs>
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
9 <param name="input1" type="data" format="csfasta" label="Select reads"/>
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
10 <param name="input2" type="data" format="qualsolid" label="Select qualities"/>
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
11 <conditional name="is_run">
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
12 <param name="paired" type="select" label="Is this a mate-pair run?">
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
13 <option value="no" selected="true">No</option>
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
14 <option value="yes">Yes</option>
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
15 </param>
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
16 <when value="yes">
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
17 <param name="input3" type="data" format="csfasta" label="Select Reverse reads"/>
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
18 <param name="input4" type="data" format="qualsolid" label="Select Reverse qualities"/>
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
19 </when>
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
20 <when value="no">
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
21 </when>
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
22 </conditional>
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
23 <param name="qual" label="Remove reads containing color qualities below this value" type="integer" value="0"/>
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
24 <param name="trim_name" type="select" label="Trim trailing &quot;_F3&quot; and &quot;_R3&quot; ?">
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
25 <option value="-t" selected="true">Yes</option>
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
26 <option value="">No</option>
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
27 </param>
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
28 <param name="trim_first_base" type="select" label="Trim first base?">
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
29 <option value="-f">Yes (BWA)</option>
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
30 <option value="" selected="true">No (bowtie)</option>
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
31 </param>
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
32 <param name="double_encode" type="select" label="Double encode?">
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
33 <option value="-d">Yes (BWA)</option>
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
34 <option value="" selected="true">No (bowtie)</option>
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
35 </param>
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
36 </inputs>
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
37 <outputs>
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
38 <data format="fastqcssanger" name="out_file1"/>
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
39 <data format="fastqcssanger" name="out_file2">
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
40 <filter>is_run['paired'] == 'yes'</filter>
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
41 </data>
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
42 </outputs>
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
43 <tests>
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
44 <test>
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
45 <param name="input1" value="fr.csfasta" ftype="csfasta"/>
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
46 <param name="input2" value="fr.qualsolid" ftype="qualsolid" />
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
47 <param name="paired" value="no"/>
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
48 <param name="qual" value="0" />
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
49 <param name="trim_first_base" value="No" />
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
50 <param name="trim_name" value="No" />
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
51 <param name="double_encode" value="No"/>
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
52 <output name="out_file1" file="solid2fastq_out_1.fastq"/>
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
53 </test>
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
54 <test>
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
55 <param name="input1" value="fr.csfasta" ftype="csfasta"/>
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
56 <param name="input2" value="fr.qualsolid" ftype="qualsolid" />
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
57 <param name="paired" value="yes"/>
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
58 <param name="input3" value="rr.csfasta" ftype="csfasta"/>
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
59 <param name="input4" value="rr.qualsolid" ftype="qualsolid" />
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
60 <param name="qual" value="0" />
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
61 <param name="trim_first_base" value="No" />
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
62 <param name="trim_name" value="Yes" />
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
63 <param name="double_encode" value="No"/>
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
64 <output name="out_file1" file="solid2fastq_out_2.fastq"/>
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
65 <output name="out_file2" file="solid2fastq_out_3.fastq"/>
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
66 </test>
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
67 </tests>
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
68 <help>
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
69
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
70 **What it does**
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
71
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
72 Converts output of SOLiD instrument (versions 3.5 and earlier) to fastq format suitable for bowtie, bwa, and PerM mappers.
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
73
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
74 --------
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
75
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
76 **Input datasets**
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
77
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
78 Below are examples of forward (F3) reads and quality scores:
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
79
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
80 Reads::
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
81
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
82 >1831_573_1004_F3
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
83 T00030133312212111300011021310132222
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
84 >1831_573_1567_F3
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
85 T03330322230322112131010221102122113
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
86
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
87 Quality scores::
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
88
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
89 >1831_573_1004_F3
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
90 4 29 34 34 32 32 24 24 20 17 10 34 29 20 34 13 30 34 22 24 11 28 19 17 34 17 24 17 25 34 7 24 14 12 22
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
91 >1831_573_1567_F3
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
92 8 26 31 31 16 22 30 31 28 29 22 30 30 31 32 23 30 28 28 31 19 32 30 32 19 8 32 10 13 6 32 10 6 16 11
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
93
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
94
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
95 **Mate pairs**
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
96
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
97 If your data is from a mate-paired run, you will have additional read and quality datasets that will look similar to the ones above with one exception: the names of reads will be ending with &quot;_R3&quot;.
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
98 In this case choose **Yes** from the *Is this a mate-pair run?* drop down and you will be able to select R reads. When processing mate pairs this tool generates two output files: one for F3 reads and the other for R3 reads.
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
99 The reads are guaranteed to be paired -- mated reads will be in the same position in F3 and R3 fastq file. However, because pairing is verified it may take a while to process an entire SOLiD run (several hours).
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
100
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
101 ------
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
102
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
103 **Explanation of parameters**
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
104
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
105 **Remove reads containing color qualities below this value** - any read that contains as least one color call with quality lower than the specified value **will not** be reported.
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
106
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
107 **Trim trailing &quot;_F3&quot; and &quot;_R3&quot;?** - does just that. Not necessary for bowtie. Required for BWA.
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
108
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
109 **Trim first base?** - SOLiD reads contain an adapter base such as the first T in this read::
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
110
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
111 >1831_573_1004_F3
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
112 T00030133312212111300011021310132222
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
113
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
114 this option removes this base leaving only color calls. Not necessary for bowtie. Required for BWA.
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
115
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
116 **Double encode?** - converts color calls (0123.) to pseudo-nucleotides (ACGTN). Not necessary for bowtie. Required for BWA.
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
117
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
118 ------
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
119
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
120 **Examples of output**
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
121
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
122 When all parameters are left &quot;as-is&quot; you will get this (using reads and qualities shown above)::
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
123
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
124 @1831_573_1004
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
125 T00030133312212111300011021310132222
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
126 +
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
127 %>CCAA9952+C>5C.?C79,=42C292:C(9/-7
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
128 @1831_573_1004
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
129 T03330322230322112131010221102122113
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
130 +
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
131 );@@17?@=>7??@A8?==@4A?A4)A+.'A+'1,
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
132
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
133 Setting *Trim first base from reads* to **Yes** will produce this::
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
134
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
135 @1831_573_1004
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
136 00030133312212111300011021310132222
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
137 +
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
138 %>CCAA9952+C>5C.?C79,=42C292:C(9/-7
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
139 @1831_573_1004
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
140 03330322230322112131010221102122113
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
141 +
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
142 );@@17?@=>7??@A8?==@4A?A4)A+.'A+'1,
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
143
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
144 Finally, setting *Double encode* to **Yes** will yield::
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
145
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
146 @1831_573_1004
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
147 TAAATACTTTCGGCGCCCTAAACCAGCTCACTGGGG
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
148 +
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
149 %>CCAA9952+C>5C.?C79,=42C292:C(9/-7
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
150 @1831_573_1004
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
151 TATTTATGGGTATGGCCGCTCACAGGCCAGCGGCCT
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
152 +
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
153 );@@17?@=>7??@A8?==@4A?A4)A+.'A+'1,
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
154
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
155
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
156
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
157
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
158
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
159 </help>
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
160 </tool>