<!--
  Galaxy tool wrapper for Picard FastqToSam.

  Builds a `java -jar picard.jar FastqToSam ...` command line from the form
  parameters below and writes a single BAM dataset (`outFile`).
  Shared tokens (@java_options@, @dataset_collections@, @RG@, @description@,
  @more_info@) and the "VS" macro are imported from picard_macros.xml.
-->
<tool name="FastqToSam" id="picard_FastqToSam" version="1.126.0">
  <description>convert Fastq data into unaligned BAM</description>
  <requirements>
    <requirement type="package" version="1.126.0">picard</requirement>
  </requirements>

  <macros>
    <import>picard_macros.xml</import>
  </macros>

  <!--
    Cheetah command template.
    * The input branch selects FASTQ / FASTQ2 from a single dataset, two
      datasets, or the forward / reverse members of a paired collection.
    * Optional read group fields are only emitted when the user supplied a
      non-empty value.
    * SORT_ORDER, QUIET and VERBOSITY are fixed and not exposed in the form.
  -->
  <command>
    @java_options@

    java -jar \$JAVA_JAR_PATH/picard.jar
    FastqToSam

    #if str( $input_type.input_type_selector ) == "se":
      FASTQ="${input_type.fastq}"
    #elif str( $input_type.input_type_selector ) == "pe":
      FASTQ="${input_type.fastq}"
      FASTQ2="${input_type.fastq2}"
    #else
      FASTQ="${input_type.fastq.forward}"
      FASTQ2="${input_type.fastq.reverse}"
    #end if

    QUALITY_FORMAT="${quality_format}"
    OUTPUT="${outFile}"
    READ_GROUP_NAME="${read_group_name}"
    SAMPLE_NAME="${sample_name}"

    #if str( $library_name ):
      LIBRARY_NAME="${library_name}"
    #end if

    #if str( $platform_unit ):
      PLATFORM_UNIT="${platform_unit}"
    #end if

    #if str( $platform ):
      PLATFORM="${platform}"
    #end if

    #if str( $sequencing_center ):
      SEQUENCING_CENTER="${sequencing_center}"
    #end if

    #if str( $predicted_insert_size ):
      PREDICTED_INSERT_SIZE="${predicted_insert_size}"
    #end if

    #if str( $comment ):
      COMMENT="${comment}"
    #end if

    #if str( $description ):
      DESCRIPTION="${description}"
    #end if

    #if str( $run_date ):
      RUN_DATE="${run_date}"
    #end if

    MIN_Q="${min_q}"
    MAX_Q="${max_q}"
    STRIP_UNPAIRED_MATE_NUMBER="${strip_unpairied_mate_number}"
    ALLOW_AND_IGNORE_EMPTY_LINES="${allow_and_ignore_empty_lines}"

    SORT_ORDER=coordinate
    VALIDATION_STRINGENCY="${validation_stringency}"
    QUIET=true
    VERBOSITY=ERROR

  </command>

  <inputs>
    <!-- Input layout: "se" = one dataset, "pe" = two datasets, "pc" = paired collection. -->
    <conditional name="input_type">
      <param name="input_type_selector" type="select" label="What is your input data" help="Select between single end, paired end, and collections. See help below for full explanation of dataset types">
        <option value="se">Single end (single dataset)</option>
        <option value="pe">Paired end (two datasets)</option>
        <option value="pc">Paired collection</option>
      </param>
      <when value="se">
        <param name="fastq" type="data" format="fastq" label="Input fastq file for single end data" help="FASTQ"/>
      </when>
      <when value="pe">
        <param name="fastq" type="data" format="fastq" label="Input fastq file for the first read in paired end data" help="FASTQ"/>
        <param name="fastq2" type="data" format="fastq" label="Input fastq file for the second read of paired end data" help="FASTQ2"/>
      </when>
      <when value="pc">
        <param name="fastq" type="data_collection" collection_type="paired" label="FASTQ paired dataset collection" help="FASTQ and FASTQ2; A collection of two datasets with forward and reverse reads. See help below on explanation of dataset collections"/>
      </when>
    </conditional>

    <param name="quality_format" type="select" label="Select quality encoding scheme" help="QUALITY_FORMAT">
      <option value="Standard" selected="True">Sanger (+33)</option>
      <option value="Illumina">Illumina (+64)</option>
      <option value="Solexa">Solexa (+66)</option>
    </param>

    <!-- Read group fields; the optional ones are omitted from the command line when left empty. -->
    <param name="read_group_name" type="text" size="20" value="A" label="Read group name" help="READ_GROUP_NAME"/>
    <param name="sample_name" type="text" size="20" value="sample-a" label="Sample name" help="SAMPLE_NAME"/>
    <param name="library_name" type="text" size="20" optional="True" label="The library name" help="LIBRARY_NAME; Optional"/>
    <param name="platform_unit" type="text" size="20" optional="True" label="The platform unit (often run_barcode.lane)" help="PLATFORM_UNIT; Optional"/>
    <param name="platform" type="text" size="20" optional="True" label="The platform type (e.g. illumina, 454)" help="PLATFORM; Optional"/>
    <param name="sequencing_center" type="text" size="20" optional="True" label="The sequencing center from which the data originated" help="SEQUENCING_CENTER; Optional"/>

    <param name="predicted_insert_size" type="integer" min="0" max="100000" optional="True" label="Predicted median insert size, to insert into the read group header" help="PREDICTED_INSERT_SIZE; Optional"/>
    <param name="comment" type="text" size="20" optional="True" label="Comment to include in the output dataset's header" help="COMMENT; Optional"/>
    <param name="description" type="text" size="20" optional="True" label="Optional description information" help="DESCRIPTION; Optional"/>
    <param name="run_date" optional="True" type="text" label="Run date" help="RUN_DATE; Optional; Format=YYYY-MM-DD (eg 1997-07-16)"/>
    <param name="min_q" type="integer" value="0" min="0" max="100" label="Minimum quality allowed in the input fastq" help="MIN_Q; An exception will be thrown if a quality is less than this value; default=0"/>
    <param name="max_q" type="integer" value="93" min="0" max="100" label="Maximum quality allowed in the input fastq" help="MAX_Q; An exception will be thrown if a quality is greater than this value; default=93"/>
    <!-- NOTE: the parameter name is misspelled ("unpairied") but is kept as-is because the command template, the test and any saved workflows reference it. -->
    <param name="strip_unpairied_mate_number" type="boolean" truevalue="true" falsevalue="false" label="If true and this is an unpaired fastq any occurrence of '/1' will be removed from the end of a read name" help="STRIP_UNPAIRED_MATE_NUMBER; default=false"/>
    <param name="allow_and_ignore_empty_lines" type="boolean" truevalue="true" falsevalue="false" label="Allow (and ignore) empty lines" help="ALLOW_AND_IGNORE_EMPTY_LINES; default=false"/>

    <!-- Presumably supplies the validation_stringency parameter used by the command and the test; defined in picard_macros.xml. -->
    <expand macro="VS" />

  </inputs>

  <outputs>
    <data format="bam" name="outFile" label="${tool.name} on ${on_string}: reads as unaligned BAM"/>
  </outputs>

  <!-- Functional test: paired end input (two datasets) with every optional field populated. -->
  <tests>
    <test>
      <param name="input_type_selector" value="pe" />
      <param name="quality_format" value="Standard" />
      <param name="read_group_name" value="A" />
      <param name="sample_name" value="sample-a" />
      <param name="library_name" value="A"/>
      <param name="platform_unit" value="A"/>
      <param name="platform" value="Illumina"/>
      <param name="sequencing_center" value="A"/>
      <param name="predicted_insert_size" value="300"/>
      <param name="comment" value="A"/>
      <param name="description" value="A"/>
      <param name="run_date" value="2014-10-10"/>
      <param name="min_q" value="0" />
      <param name="max_q" value="93" />
      <param name="strip_unpairied_mate_number" value="False" />
      <param name="allow_and_ignore_empty_lines" value="False" />
      <param name="validation_stringency" value="LENIENT"/>
      <param name="fastq" value="picard_FastqToSam_read1.fq" ftype="fastq" />
      <param name="fastq2" value="picard_FastqToSam_read2.fq" ftype="fastq" />
      <output name="outFile" file="picard_FastqToSam_test1.bam" ftype="bam" lines_diff="4"/>
    </test>
  </tests>

  <!-- Any non-zero exit code marks the job as failed. -->
  <stdio>
    <exit_code range="1:" level="fatal"/>
  </stdio>

  <!--
    reStructuredText help. The body text stays at column 0 on purpose because
    RST is indentation-sensitive; the Picard option listing is indented so that
    it is rendered as one block after the @description@ token.
  -->
  <help>

.. class:: infomark

**Purpose**

Converts FASTQ data into an unaligned BAM dataset.

@dataset_collections@

@RG@

@description@

  FASTQ=File
  F1=File                       Input fastq file for single end data, or first read in paired end
                                data. Required.

  FASTQ2=File
  F2=File                       Input fastq file for the second read of paired end data (if used).

  QUALITY_FORMAT=FastqQualityFormat
  V=FastqQualityFormat          A value describing how the quality values are encoded in the fastq. Either Solexa for
                                pre-pipeline 1.3 style scores (solexa scaling + 66), Illumina for pipeline 1.3 and above
                                (phred scaling + 64) or Standard for phred scaled scores with a character shift of 33.
                                If this value is not specified, the quality format will be detected automatically.
                                Default value: null. Possible values: {Solexa, Illumina, Standard}

  READ_GROUP_NAME=String
  RG=String                     Read group name Default value: A.

  SAMPLE_NAME=String
  SM=String                     Sample name to insert into the read group header Required.

  LIBRARY_NAME=String
  LB=String                     The library name to place into the LB attribute in the read group header.

  PLATFORM_UNIT=String
  PU=String                     The platform unit (often run_barcode.lane) to insert into the read group header.

  PLATFORM=String
  PL=String                     The platform type (e.g. illumina, solid) to insert into the read group header.

  SEQUENCING_CENTER=String
  CN=String                     The sequencing center from which the data originated.

  PREDICTED_INSERT_SIZE=Integer
  PI=Integer                    Predicted median insert size, to insert into the read group header.

  COMMENT=String
  CO=String                     Comment to include in the merged output file's header.

  DESCRIPTION=String
  DS=String                     Inserted into the read group header.

  RUN_DATE=Iso8601Date
  DT=Iso8601Date                Date the run was produced, to insert into the read group header.

  MIN_Q=Integer                 Minimum quality allowed in the input fastq. An exception will be thrown if a quality is
                                less than this value. Default value: 0.

  MAX_Q=Integer                 Maximum quality allowed in the input fastq. An exception will be thrown if a quality is
                                greater than this value. Default value: 93.

  STRIP_UNPAIRED_MATE_NUMBER=Boolean
                                If true and this is an unpaired fastq any occurrence of '/1' will be removed from the end
                                of a read name. Default value: false. Possible values: {true, false}

  ALLOW_AND_IGNORE_EMPTY_LINES=Boolean
                                Allow (and ignore) empty lines Default value: false. Possible values: {true, false}


@more_info@

  </help>
</tool>