annotate je-demultiplex-illu.xml @ 7:370d9764f670 draft

planemo upload for repository https://git.embl.de/grp-gbcs/Je/tree/master/src/galaxy commit e217faa15f73427979bb212036cb130a14c59750
author gbcs-embl-heidelberg
date Mon, 05 Mar 2018 07:13:47 -0500
parents 69c77f9fc064
children 9dad3d0b27bc
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
3
01fdc6d10660 planemo upload for repository https://git.embl.de/grp-gbcs/Je/tree/master/src/galaxy commit dd9e62bdb01d1252a90ce778103ce9b6b4a8cd52-dirty
gbcs-embl-heidelberg
parents: 0
diff changeset
1 <tool id="je_demultiplex_illu" name="Je-Demultiplex-Illu" version="@VERSION_STRING@">
0
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
2 <description>demultiplexes fastq files using Illumina Index file</description>
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
3 <macros>
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
4 <import>macros.xml</import>
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
5 </macros>
5
69c77f9fc064 planemo upload for repository https://git.embl.de/grp-gbcs/Je/tree/master/src/galaxy commit 0eefd837333dae6fbecaf4f55b053268d844eff6
gbcs-embl-heidelberg
parents: 3
diff changeset
6 <expand macro="requirements" />
0
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
7 <stdio>
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
8 <exit_code range="1:" level="fatal" description="Tool exception" />
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
9 </stdio>
5
69c77f9fc064 planemo upload for repository https://git.embl.de/grp-gbcs/Je/tree/master/src/galaxy commit 0eefd837333dae6fbecaf4f55b053268d844eff6
gbcs-embl-heidelberg
parents: 3
diff changeset
10 <expand macro="version_command" />
69c77f9fc064 planemo upload for repository https://git.embl.de/grp-gbcs/Je/tree/master/src/galaxy commit 0eefd837333dae6fbecaf4f55b053268d844eff6
gbcs-embl-heidelberg
parents: 3
diff changeset
11 <command>
0
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
12 <![CDATA[
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
13 je demultiplex-illu
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
14
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
15 ## Fastq inputs
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
16 @single_or_paired_illu_cmd@
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
17
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
18 @barcode_option_cmd@
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
19
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
20 #if str($INTERNAL_BARCODES_CON.INTERNAL_BARCODES) == 'true':
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
21 BPOS=${INTERNAL_BARCODES_CON.BPOS}
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
22 C=${INTERNAL_BARCODES_CON.CLIP_BARCODE}
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
23 #if str( $INTERNAL_BARCODES_CON.LEN ) != "":
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
24 BCLEN=$INTERNAL_BARCODES_CON.LEN
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
25 #end if
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
26 #else:
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
27 BPOS=NONE
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
28 C=false
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
29 #end if
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
30
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
31 @common_options_cmd@
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
32
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
33 @demultiplexer_common_output_options_cmd@
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
34 @demultiplexer_common_outputs_cmd@
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
35 ]]>
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
36 </command>
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
37 <configfiles>
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
38 <expand macro="barcode_config_file"/>
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
39 </configfiles>
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
40 <inputs>
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
41 <!-- single/paired - similar to macro 'single_or_paired_general' -->
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
42 <expand macro="single_or_paired_illu">
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
43 <expand macro="demultiplex_illu_paired_end_options"/>
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
44 </expand>
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
45 <expand macro="barcode_option"/>
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
46 <conditional name="INTERNAL_BARCODES_CON">
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
47 <param name="INTERNAL_BARCODES" type="select"
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
48 label="Do your reads contain Unique Molecular Identifiers(UMIs)">
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
49 <option value="true">Yes</option>
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
50 <option value="false" selected="true">No</option>
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
51 </param>
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
52 <when value="true">
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
53 <param name="BPOS" type="select" label="Barcode read position (BPOS)" help="where are the barcodes.
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
54 If not using paired-end it does not matter what you specify here.">
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
55 <option value="READ_1" selected="true">READ_1 (beginning of read from the first fastq file)</option>
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
56 <option value="READ_2">READ_2 (beginning of read from the second fastq file)</option>
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
57 <option value="BOTH">BOTH (beginning of both reads)</option>
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
58 </param>
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
59 <expand macro="barcode_len_option"/>
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
60 <expand macro="clip_barcode"/>
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
61 </when>
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
62 <when value="false"/>
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
63 </conditional>
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
64
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
65 <expand macro="demultiplexer_common_options"/>
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
66
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
67 <expand macro="common_options"/>
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
68
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
69 <expand macro="demultiplexer_common_output_options"/>
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
70
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
71 </inputs>
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
72 <outputs>
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
73 <expand macro="demultiplexer_common_outputs"/>
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
74 </outputs>
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
75
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
76 <tests>
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
77 <test>
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
78 <!-- barcode at both ends, non-redundant -->
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
79 <param name="type" value="paired"/>
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
80 <param name="input_1" value="illu_file_1_sequence.txt" ftype="fastqsanger"/>
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
81 <param name="input_2" value="illu_file_2_sequence.txt" ftype="fastqsanger"/>
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
82 <param name="I1" value="illu_file_1_index.txt" ftype="fastqsanger"/>
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
83 <param name="I2_AVAILABLE" value="true"/>
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
84 <param name="I2" value="illu_file_2_index.txt" ftype="fastqsanger"/>
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
85
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
86 <param name="INTERNAL_BARCODES" value="true"/>
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
87 <param name="barcode_list_type_con" value="file"/>
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
88 <param name="BARCODE_FILE" value="illu_dualindexing.txt" ftype="tabular"/>
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
89 <param name="LEN" value="8:8"/>
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
90 <param name="ZT" value="5:6"/>
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
91 <param name="BPOS" value="BOTH"/>
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
92 <param name="BM" value="BOTH"/>
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
93 <param name="BRED" value="false"/>
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
94 <param name="MM" value="3"/>
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
95 <param name="MMD" value="2"/>
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
96 <param name="Q" value="20"/>
5
69c77f9fc064 planemo upload for repository https://git.embl.de/grp-gbcs/Je/tree/master/src/galaxy commit 0eefd837333dae6fbecaf4f55b053268d844eff6
gbcs-embl-heidelberg
parents: 3
diff changeset
97 <param name="DIAG" value="false"/>
7
370d9764f670 planemo upload for repository https://git.embl.de/grp-gbcs/Je/tree/master/src/galaxy commit e217faa15f73427979bb212036cb130a14c59750
gbcs-embl-heidelberg
parents: 5
diff changeset
98 <output name="METRICS_FILE_NAME" file="illu_summary_PE.txt" ftype="tabular" lines_diff="4"/>
370d9764f670 planemo upload for repository https://git.embl.de/grp-gbcs/Je/tree/master/src/galaxy commit e217faa15f73427979bb212036cb130a14c59750
gbcs-embl-heidelberg
parents: 5
diff changeset
99 <output name="DEMULTIPLEX_RESULTS" ftype="tabular">
0
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
100 <discovered_dataset designation="unassigned_1" file="illu_unassigned_1_PE.txt" />
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
101 <discovered_dataset designation="unassigned_2" file="illu_unassigned_2_PE.txt" />
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
102 <discovered_dataset designation="emb681m5_GGACTCCTCTCTCTAT_2" file="emb681m5_GGACTCCTCTCTCTAT_2.txt"/>
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
103 <discovered_dataset designation="emb681m5_GGACTCCTCTCTCTAT_1" file="emb681m5_GGACTCCTCTCTCTAT_1.txt"/>
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
104 <discovered_dataset designation="emb681m4_TCCTGAGCCTCTCTAT_2" file="emb681m4_TCCTGAGCCTCTCTAT_2.txt"/>
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
105 <discovered_dataset designation="emb681m4_TCCTGAGCCTCTCTAT_1" file="emb681m4_TCCTGAGCCTCTCTAT_1.txt"/>
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
106 <discovered_dataset designation="emb681m1_TAAGGCGACTCTCTAT_2" file="emb681m1_TAAGGCGACTCTCTAT_2.txt"/>
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
107 <discovered_dataset designation="emb681m1_TAAGGCGACTCTCTAT_1" file="emb681m1_TAAGGCGACTCTCTAT_1.txt"/>
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
108 <discovered_dataset designation="emb6801m2_AGGCAGAATAGATCGC_2" file="emb6801m2_AGGCAGAATAGATCGC_2.txt"/>
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
109 <discovered_dataset designation="emb6801m2_AGGCAGAATAGATCGC_1" file="emb6801m2_AGGCAGAATAGATCGC_1.txt"/>
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
110 <discovered_dataset designation="emb6801m1_CGTACTAGTAGATCGC_2" file="emb6801m1_CGTACTAGTAGATCGC_2.txt"/>
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
111 <discovered_dataset designation="emb6801m1_CGTACTAGTAGATCGC_1" file="emb6801m1_CGTACTAGTAGATCGC_1.txt"/>
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
112 </output>
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
113 </test>
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
114 </tests>
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
115
5
69c77f9fc064 planemo upload for repository https://git.embl.de/grp-gbcs/Je/tree/master/src/galaxy commit 0eefd837333dae6fbecaf4f55b053268d844eff6
gbcs-embl-heidelberg
parents: 3
diff changeset
116 <help>
0
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
117 <![CDATA[
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
118 **What it does**
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
119
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
120 Je demultiplex-illu: demultiplex fastq files using Illumina Index files,
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
121 with optional handling of Unique Molecular Identifiers for further use in 'markdupes' module.
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
122 Input files are fastq files, and can be in gzip compressed format.
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
123
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
124 Author: Charles Girardot (charles.girardot@embl.de).
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
125
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
126 Wrapper by: Jelle Scholtalbers (jelle.scholtalbers@embl.de).
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
127
7
370d9764f670 planemo upload for repository https://git.embl.de/grp-gbcs/Je/tree/master/src/galaxy commit e217faa15f73427979bb212036cb130a14c59750
gbcs-embl-heidelberg
parents: 5
diff changeset
128 With contributions by: Mehmet Tekman (@mtekman)
370d9764f670 planemo upload for repository https://git.embl.de/grp-gbcs/Je/tree/master/src/galaxy commit e217faa15f73427979bb212036cb130a14c59750
gbcs-embl-heidelberg
parents: 5
diff changeset
129
0
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
130 ------
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
131
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
132 **Know what you are doing**
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
133
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
134 .. class:: warningmark
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
135
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
136 You will want to read the `documentation`__.
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
137
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
138 .. __: http://gbcs.embl.de/portal/Je
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
139
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
140 ------
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
141
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
142 **Parameter list**
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
143
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
144 This is an exhaustive list of options::
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
145
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
146 FASTQ_FILE1=File
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
147 F1=File
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
148
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
149 Input fastq file (optionally gzipped) for single end data, or first read in paired end
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
150 data.
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
151
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
152 Required.
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
153
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
154 FASTQ_FILE2=File
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
155 F2=File
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
156
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
157 Input fastq file (optionally gzipped) for the second read of paired end data.
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
158
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
159 Default value: null.
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
160
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
161 INDEX_FILE1=File
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
162 I1=File
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
163
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
164 Fastq file for index 1 (barcode) reads, optionally gzipped
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
165
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
166 Required.
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
167
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
168 INDEX_FILE2=File
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
169 I2=File
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
170
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
171 Fastq file for index 2 (barcode) reads, optionally gzipped.
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
172 An INDEX_FILE1 MUST be provided when INDEX_FILE2 is given. This situation corresponds to
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
173 Illumina dual indexing.
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
174
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
175 Default value: null.
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
176
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
177 BARCODE_FILE=File
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
178 BF=File
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
179
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
180 Barcode file describing sequence list and sample names. Tab-delimited file with 2
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
181 columns, with the sample in col1 and the corresponding barcode in col2.
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
182 Simple barcode file format : 2 tab-delimited columns
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
183 If multiple barcodes map to the same sample, either line can be duplicated e.g.
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
184 sample1 ATAT
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
185 sample1 GAGG
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
186 sample2 CCAA
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
187 sample2 TGTG
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
188 Or barcodes can be combined using the OR operator '|' i.e. the file above can be
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
189 re-written like
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
190 sample1 ATAT|GAGG
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
191 sample2 CCAA|TGTG
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
192 Finally, for the special situation of paired-end data in which barcodes differ at both
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
193 ends (ie BPOS=BOTH BRED=false BM=BOTH , see BRED option description), barcodes for read_1
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
194 and read_2 can be distinguished using a ':' separator i.e.
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
195 sample1 ATAT:GAGG
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
196 sample2 CCAA:TGTG
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
197 This above syntax means that sample 1 is encoded with ATAT barcode at read_1 AND GAGG
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
198 barcode at read_2. Note that you can still combine barcodes using | e.g.
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
199 sample1 ATAT|GAGG:CCAA|TGTG
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
200 would mean that sample 1 is mapped by the combination of barcode: ATAT OR GAGG at read_1
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
201 AND CCAA OR TGTG at read_2.
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
202 Extended barcode file format : 3 (single-end) or 4 (paired-end) tab-delimited columns
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
203 same as the simple barcode file format but the extra columns contain the file name(s)
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
204 to use to name output files. A unique extra column is expected for single-end while 2
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
205 extra columns are expected for paired-end. In case lines are duplicated (multiple
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
206 barcodes mapping the same sample), the same file name should be indicated in the third
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
207 (and fourth) column(s).
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
208 sample1 ATAT spl1_1.txt.gz spl1_2.txt.gz
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
209 sample1 GAGG spl1_1.txt.gz spl1_2.txt.gz
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
210 sample2 CCAA spl2_1.txt.gz spl2_2.txt.gz
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
211 Or
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
212 sample1 ATAT|GAGG:CCAA|TGTG spl1_1.txt.gz spl1_2.txt.gz
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
213 Ns in barcode sequence are allowed and are used to flag positions that should be ignored
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
214 in sample matching
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
215 i.e. they will be clipped off the read sequence (like in iCLIP protocol).
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
216
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
217 Required.
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
218
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
219 BARCODE_READ_POS=BarcodePosition
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
220 BPOS=BarcodePosition
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
221
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
222 Indicates the location of additional barcodes present in the read(s). Setting this option
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
223 implies setting the LEN option.
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
224 Importantly, these additional barcodes must not encode sample identity information but
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
225 are instead used for e.g. molecular barcoding (UMIs) or for any purpose other than sample identity encoding.
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
226
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
227 Default value: BOTH. This option can be set to 'null' to clear the default value.
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
228 Possible values: {READ_1, READ_2, BOTH, NONE}
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
229
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
230 BCLEN=String
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
231 LEN=String
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
232
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
233 Length of the barcode sequences, optional. Taken from barcode file when not given.
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
234 In situations where BARCODE_READ_POS == BOTH AND REDUNDANT_BARCODES=false, two distinct
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
235 lengths can be provided using the syntax LEN=X:Z where X and Z are 2 integers representing
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
236 the barcode length for read_1 and read_2 respectively.
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
237
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
238 Default value: null
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
239
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
240 REDUNDANT_BARCODES=Boolean
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
241 BRED=Boolean
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
242
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
243 This option only applies for paired-end data with *both* INDEX_FILE1 and INDEX_FILE2
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
244 provided.
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
245 Indicates if both index barcodes encode redundant information i.e. if both barcodes are
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
246 supposed to be identical (or resolve to the same sample when a pool of barcodes is used
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
247 per sample).
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
248 When BRED=true, the STRICT option guides the sample lookup behavior. When BRED=false,
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
249 barcodes are combined prior to sample lookup.
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
250
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
251 Default value: true. This option can be set to 'null' to clear the default value.
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
252 Possible values: {true, false}
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
253
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
254 STRICT=Boolean
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
255 S=Boolean
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
256
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
257 For paired-end data and when two distinct barcodes/indices are used to encode samples,
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
258 this option tells if both barcodes should resolve to the same sample.
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
259 When true and if only one of the two reads has a barcode match, the read pair is
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
260 'unassigned'.
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
261 When false and if only one of the two reads has a barcode match, the read pair is
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
262 assigned to the
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
263 corresponding sample.
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
264 When reads resolve to different samples, the read pair is always 'unassigned'.
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
265
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
266 Default value: false. This option can be set to 'null' to clear the default value.
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
267 Possible values: {true, false}
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
268
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
269 MAX_MISMATCHES=String
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
270 MM=String
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
271
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
272 Maximum mismatches for a barcode to be considered a match. In situations where both
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
273 barcodes are used for sample matching i.e. BPOS=BOTH BM=BOTH (or 2 INDEX_FILE given), two
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
274 distinct
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
275 values can be given here using the syntax MM=X:Z where X and Z are 2 integers to use for
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
276 read_1 and read_2 respectively.
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
277 MM=null is like MM=0
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
278
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
279 Default value: 1. This option can be set to 'null' to clear the default value.
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
280
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
281 MIN_MISMATCH_DELTA=String
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
282 MMD=String
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
283
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
284 Minimum difference between the number of mismatches against the best and the second best
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
285 barcode. When MMD is not respected, the read remains unassigned.
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
286 When two distinct barcodes are used for sample matching (dual encoding), two distinct
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
287 values can be given using the syntax MMD=X:Z where X and Z are 2 integers to use for
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
288 first (e.g. from read_1 or index_1) and second barcode (e.g. from read_2 or index_2) respectively.
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
289 MMD=null is like MMD=0
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
290
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
291 Default value: 1. This option can be set to 'null' to clear the default value.
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
292
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
293 MIN_BASE_QUALITY=String
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
294 Q=String
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
295
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
296 Minimum base quality during barcode matching: bases whose quality is less than this
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
297 cutoff are always considered as a mismatch. When two distinct barcodes are used for sample
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
298 matching (dual encoding), two distinct values can be given using the syntax Q=X:Z where X
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
299 and Z are 2 integers to use for first (e.g. from read_1 or index_1) and second barcode
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
300 (e.g. from read_2 or index_2) respectively.
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
301 Q=null is like Q=0.
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
302
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
303 Default value: 10. This option can be set to 'null' to clear the default value.
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
304
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
305 XTRIMLEN=String
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
306 XT=String
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
307
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
308 Optional extra number of bases to be trimmed right after the barcode (only used if
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
309 CLIP_BARCODE=true).
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
310 When running paired-end, two distinct values can be given using the syntax XT=X:Z where X
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
311 and Z are 2 integers to use for read_1 and read_2 respectively. Note that even when
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
312 BPOS=READ_1 or BPOS=READ_2, an X:Z syntax can be given to trim the read w/o barcode so as to
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
313 end up with reads of the same length (note that this can also be operated using ZT). If a
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
314 unique value is given, e.g. XT=1, while running paired-end the following rule applies:
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
315 (1) BPOS=READ_1 or BPOS=READ_2, no trim is applied at the read w/o barcode
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
316 (2) BPOS=BOTH, the value is used for both reads.
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
317
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
318 Note that XT=null is like XT=0.
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
319 Default value: 0. This option can be set to 'null' to clear the default value.
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
320
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
321 ZTRIMLEN=String
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
322 ZT=String
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
323
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
324 Optional extra number of bases to be trimmed from the read end i.e. 3' end.
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
325 When running paired-end, two distinct values can be given here using the syntax ZT=X:Z
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
326 where X and Z are 2 integers to use for read_1 and read_2 respectively. Note that even
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
327 when BPOS=READ_1 or BPOS=READ_2, an X:Z syntax can be given to trim the read w/o barcode
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
328 so as to end up with reads of the same length (note that this can also be operated using
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
329 XT). Note that if a single value is passed, the value always applies to both reads in
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
330 paired-end mode without further consideration.
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
331 ZT=null is like ZT=0.
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
332
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
333 Default value: 0. This option can be set to 'null' to clear the default value.
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
334
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
335 CLIP_BARCODE=Boolean
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
336 C=Boolean
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
337
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
338 Clip barcode sequence from read sequence, as well as XTRIMLEN (and ZTRIMLEN) bases if
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
339 applicable, before writing to output file.
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
340 If false, reads are written without modification to output file.
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
341 Apply to both barcodes when BPOS=BOTH.
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
342
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
343 Default value: true. This option can be set to 'null' to clear the default value.
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
344 Possible values: {true, false}
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
345
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
346 ADD_BARCODE_TO_HEADER=Boolean
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
347 ADD=Boolean
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
348
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
349 Add matched barcode at the end of the read header. Applies to both indices when INDEX_FILE2
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
350 is also provided.
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
351 First the sample encoding barcodes from I1 (and I2 when relevant) are added to the read
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
352 headers like
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
353 @D3FCO8P1:178:C1WLBACXX:7:1101:1836:1965 2:N:0:I1_BARCODE:I2_BARCODE
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
354 Then, if BPOS!=NONE, the additional barcodes (UMIs) clipped from the read(s) are added
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
355 to their own header, like
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
356 @D3FCO8P1:178:C1WLBACXX:7:1101:1836:1965 2:N:0:I1_BARCODE:I2_BARCODE:CLIPPED_SEQ_FROMREAD
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
357
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
358 Default value: true. This option can be set to 'null' to clear the default value.
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
359 Possible values: {true, false}
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
360
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
361 ENSURE_IDENTICAL_HEADER_NAMES=Boolean
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
362 SAME_HEADERS=Boolean
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
363
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
364 Makes sure that headers of both reads of a pair are identical, using the following read
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
365 header pattern (for both reads of a pair):
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
366 @D3FCO8P1:178:C1WLBACXX:7:1101:1836:1965 I1_BARCODE:I2_BARCODE(:CLIPPED_SEQ_FROMREAD1:CLIPPED_SEQ_FROMREAD2)
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
367 This option only makes sense in paired end mode and ADD=true. Some (if not all) mappers
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
368 will indeed complain when the read headers are not identical. When molecular barcodes are
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
369 present in reads and the RCHAR is used, you will end up with (problematic) read headers like
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
370 this:
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
371 HISEQ:44:C6KC0ANXX:5:1101:1491:1994:1:N:0:TAGAACAC:TGGAGTAG
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
372 HISEQ:44:C6KC0ANXX:5:1101:1491:1994:3:N:0:TAGAACAC:CGTTGTAT
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
373 SAME_HEADERS=true will instead generate the following identical header for both reads:
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
374 HISEQ:44:C6KC0ANXX:5:1101:1491:1994:TAGAACAC:TGGAGTAG:CGTTGTAT
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
375 Note that we also clipped the useless '1:N:0' and '3:N:0' as they would also result in
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
376 generating different headers
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
377 Important: this option will force RCHAR=: UNLESS you specify RCHAR=null ; in which
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
378 case a space will be preserved, i.e.:
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
379 HISEQ:44:C6KC0ANXX:5:1101:1491:1994 TAGAACAC:TGGAGTAG:CGTTGTAT
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
380
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
381 Default value: true. This option can be set to 'null' to clear the default value.
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
382 Possible values: {true, false}
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
383
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
384 READ_NAME_REPLACE_CHAR=String
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
385 RCHAR=String
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
386
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
387 Replace spaces in read name/header using provided character. This is particularly handy
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
388 when you need to retain ADDed barcode in read name/header during mapping (everything
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
389 after space in read name is usually clipped in BAM files). For example, with RCHAR=':':
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
390 '@D3FCO8P1:178:C1WLBACXX:7:1101:1836:1965 2:N:0:'
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
391 becomes
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
392 '@D3FCO8P1:178:C1WLBACXX:7:1101:1836:1965:2:N:0:BARCODE'
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
393 Default value: null.
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
394
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
395 QUALITY_FORMAT=FastqQualityFormat
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
396 V=FastqQualityFormat
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
397
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
398 A value describing how the quality values are encoded in the fastq. Either 'Solexa' for
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
399 pre-pipeline 1.3 style scores (solexa scaling + 66), 'Illumina' for pipeline 1.3 and
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
400 above (phred scaling + 64) or 'Standard' for phred scaled scores with a character shift
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
401 of 33. If this value is not specified (or 'null' is given), the quality format will be
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
402 detected.
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
403
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
404 Default value: Standard. This option can be set to 'null' to clear the default value.
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
405 Possible values: {Solexa, Illumina, Standard}
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
406
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
407 KEEP_UNASSIGNED_READ=Boolean
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
408 UN=Boolean
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
409
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
410 Should un-assigned reads be saved in files or simply ignored. File names are
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
411 automatically created or can be given using UF1 & UF2 options.
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
412
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
413 Default value: true. This option can be set to 'null' to clear the default value.
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
414 Possible values: {true, false}
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
415
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
416 BARCODE_DIAG_FILE=String
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
417 DIAG=String
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
418
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
419 Name for a barcode match reporting file (not generated by default). Either a name (in
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
420 which case the file will be created in the output dir) or full path. This file will
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
421 contain a line per read pair with the barcode best matching the read subsequence or
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
422 'null' when no match is found according to matching parameters ; and the final selected
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
423 sample. This file is useful for debugging or further processing in case both ends are
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
424 barcoded.
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
425 N.B: this file will have a size of about one of the fastq input files.
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
426
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
427 Default value: null.
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
428 ]]>
5
69c77f9fc064 planemo upload for repository https://git.embl.de/grp-gbcs/Je/tree/master/src/galaxy commit 0eefd837333dae6fbecaf4f55b053268d844eff6
gbcs-embl-heidelberg
parents: 3
diff changeset
429 </help>
69c77f9fc064 planemo upload for repository https://git.embl.de/grp-gbcs/Je/tree/master/src/galaxy commit 0eefd837333dae6fbecaf4f55b053268d844eff6
gbcs-embl-heidelberg
parents: 3
diff changeset
430 <expand macro="citations"/>
0
111ba1180318 Initial upload
gbcs-embl-heidelberg
parents:
diff changeset
431 </tool>