annotate cutadapt/cutadapt.xml @ 1:b4479aea41df draft

Uploaded
author jackcurragh
date Wed, 13 Apr 2022 09:38:42 +0000
parents
children 2767f70dfbd3
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
1
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
1 <tool id="cutadapt" name="Cutadapt" version="@TOOL_VERSION@+galaxy@VERSION_SUFFIX@" profile="20.01">
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
2 <description>Remove adapter sequences from FASTQ/FASTA</description>
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
3 <macros>
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
4 <import>macros.xml</import>
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
5 </macros>
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
6 <expand macro='edam_ontology' />
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
7 <expand macro='xrefs'/>
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
8 <expand macro='requirements' />
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
9 <version_command>cutadapt --version</version_command>
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
10
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
11 <command detect_errors="exit_code"><![CDATA[
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
12 ## Link in the input and output files, so Cutadapt can tell their type
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
13
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
14 #import re
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
15 #set read1 = "input_f"
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
16 #set read2 = "input_r"
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
17 #set paired = False
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
18 #set library_type = str($library.type)
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
19 #if $library_type == 'paired':
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
20 #set paired = True
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
21 #set read1 = re.sub('[^\w\-\s]', '_', str($library.input_1.element_identifier))
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
22 #set read2 = re.sub('[^\w\-\s]', '_', str($library.input_2.element_identifier))
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
23 #set input_1 = $library.input_1
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
24 #set input_2 = $library.input_2
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
25 #else if $library_type == 'paired_collection'
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
26 #set paired = True
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
27 #set input_1 = $library.input_1.forward
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
28 #set input_2 = $library.input_1.reverse
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
29 #set read1 = re.sub('[^\w\-\s]', '_', str($library.input_1.name)) + "_1"
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
30 #set read2 = re.sub('[^\w\-\s]', '_', str($library.input_1.name)) + "_2"
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
31 #else
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
32 #set input_1 = $library.input_1
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
33 #set read1 = re.sub('[^\w\-\s]', '_', str($library.input_1.element_identifier))
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
34 #end if
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
35
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
36 #if $input_1.is_of_type("fastq.gz", "fastqsanger.gz"):
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
37 #set ext = ".fq.gz"
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
38 #else if $input_1.is_of_type("fastq.bz2", "fastqsanger.bz2"):
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
39 #set ext = ".fq.bz2"
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
40 #else if $input_1.is_of_type('fasta'):
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
41 #set ext = ".fa"
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
42 #else:
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
43 #set ext = ".fq"
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
44 #end if
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
45 #set read1 = $read1 + $ext
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
46 #set out1 = "out1" + $ext
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
47 #set rest_output = "rest_output" + $ext
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
48 #set wild_output = "wild_output" + $ext
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
49 #set too_short_output = "too_short_output" + $ext
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
50 #set too_long_output = "too_long_output" + $ext
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
51 #set untrimmed_output = "untrimmed_output" + $ext
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
52 ln -f -s '${input_1}' '$read1' &&
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
53
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
54 #if $paired:
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
55 #if $input_2.is_of_type("fastq.gz", "fastqsanger.gz"):
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
56 #set ext2 = ".fq.gz"
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
57 #else if $input_2.is_of_type("fastq.bz2", "fastqsanger.bz2"):
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
58 #set ext2 = ".fq.gz"
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
59 #else if $input_2.is_of_type('fasta'):
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
60 #set ext2 = ".fa"
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
61 #else:
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
62 #set ext2 = ".fq"
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
63 #end if
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
64 #set read2 = $read2 + $ext2
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
65 #set out2 = "out2" + $ext2
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
66 #set too_short_paired_output = "too_short_paired_output" + $ext2
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
67 #set too_long_paired_output = "too_long_paired_output" + $ext2
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
68 #set untrimmed_paired_output = "untrimmed_paired_output" + $ext2
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
69 ln -f -s '${input_2}' '$read2' &&
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
70 #end if
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
71
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
72 ## Run Cutadapt
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
73
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
74 #if 'multiple_output' in $output_selector:
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
75 mkdir split &&
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
76 #end if
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
77
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
78 cutadapt
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
79
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
80 -j=\${GALAXY_SLOTS:-4}
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
81
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
82 #if 'json_stats' in $output_selector:
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
83 --json stats.json
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
84 #end if
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
85
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
86 #if str( $library.type ) == "single":
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
87 @read1_options@
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
88 #if 'multiple_output' in $output_selector:
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
89 --output='split/{name}.${input_1.ext}'
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
90 #else:
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
91 --output='$out1'
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
92 #end if
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
93 #else:
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
94 @read1_options@
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
95 @read2_options@
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
96 --output='$out1'
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
97 --paired-output='$out2'
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
98 #end if
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
99
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
100 --error-rate=$adapter_options.error_rate
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
101 --times=$adapter_options.times
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
102 --overlap=$adapter_options.overlap
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
103 $adapter_options.no_indels
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
104 $adapter_options.match_read_wildcards
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
105 --action=$adapter_options.action
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
106 $adapter_options.revcomp
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
107
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
108 $filter_options.discard_trimmed
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
109 $filter_options.discard_untrimmed
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
110
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
111 #if str($filter_options.minimum_length) and str($filter_options.length_R2_options.length_R2_status) == 'True':
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
112 --minimum-length=$filter_options.minimum_length:$filter_options.length_R2_options.R2_minimum
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
113 #else if str($filter_options.minimum_length):
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
114 --minimum-length=$filter_options.minimum_length
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
115 #end if
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
116 #if str($filter_options.maximum_length) and str($filter_options.length_R2_options.length_R2_status) == 'True':
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
117 --maximum-length=$filter_options.maximum_length:$filter_options.length_R2_options.R2_maximum
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
118 #else if str($filter_options.maximum_length):
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
119 --maximum-length=$filter_options.maximum_length
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
120 #end if
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
121 #if str($filter_options.max_n):
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
122 --max-n=$filter_options.max_n
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
123 #end if
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
124 #if str( $library.type ) != "single":
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
125 #if $filter_options.pair_filter:
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
126 --pair-filter=$filter_options.pair_filter
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
127 #end if
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
128 #end if
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
129 #if str($filter_options.max_expected_errors):
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
130 --max-expected-errors=$filter_options.max_expected_errors
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
131 #end if
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
132 $filter_options.discard_cassava
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
133
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
134 #if str($read_mod_options.quality_cutoff) != '0':
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
135 --quality-cutoff=$read_mod_options.quality_cutoff
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
136 #end if
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
137 #if str($read_mod_options.nextseq_trim) != '0':
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
138 --nextseq-trim=$read_mod_options.nextseq_trim
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
139 #end if
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
140 $read_mod_options.trim_n
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
141 #if $read_mod_options.strip_suffix != ''
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
142 --strip-suffix $read_mod_options.strip_suffix
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
143 #end if
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
144 #if str($read_mod_options.shorten_options.shorten_values) == 'True':
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
145 #if str($read_mod_options.shorten_options.shorten_end) == '3prime'
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
146 --length=$read_mod_options.shorten_options.length
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
147 #else
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
148 --length=-$read_mod_options.shorten_options.length
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
149 #end if
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
150 #end if
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
151 #if str($read_mod_options.length_tag) != '':
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
152 --length-tag='$read_mod_options.length_tag'
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
153 #end if
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
154 #if str($read_mod_options.rename) != '':
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
155 --rename='$read_mod_options.rename'
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
156 #end if
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
157 $read_mod_options.zero_cap
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
158
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
159
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
160 '${read1}'
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
161 #if $paired:
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
162 '${read2}'
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
163 #if $library.r2.quality_cutoff2:
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
164 -Q=$library.r2.quality_cutoff2
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
165 #end if
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
166 #end if
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
167
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
168 #if 'report' in $output_selector:
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
169 > report.txt
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
170 #end if
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
171 ]]></command>
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
172 <inputs>
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
173
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
174 <!-- Reads -->
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
175 <conditional name="library">
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
176 <param name="type" type="select" label="Single-end or Paired-end reads?">
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
177 <option value="single">Single-end</option>
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
178 <option value="paired">Paired-end</option>
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
179 <option value="paired_collection">Paired-end Collection</option>
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
180 </param>
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
181
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
182 <when value="single">
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
183 <param name="input_1" format="@FASTQ_TYPES@" type="data" label="FASTQ/A file" help="Should be of datatype &quot;fastq.gz&quot; or &quot;fasta&quot;" />
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
184 <expand macro="single_end_options" />
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
185 </when>
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
186
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
187 <when value="paired">
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
188 <param name="input_1" format="@FASTQ_TYPES@" type="data" label="FASTQ/A file #1" help="Should be of datatype &quot;fastq.gz&quot;or &quot;fasta&quot;" />
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
189 <param name="input_2" format="@FASTQ_TYPES@" type="data" label="FASTQ/A file #2" help="Should be of datatype &quot;fastq.gz&quot;or &quot;fasta&quot;" />
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
190 <expand macro="paired_end_options" />
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
191 </when>
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
192
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
193 <when value="paired_collection">
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
194 <param name="input_1" format="@FASTQ_TYPES@" type="data_collection" collection_type="paired" label="Paired Collection" help="Should be of datatype &quot;fastq.gz&quot; or &quot;fasta&quot;" />
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
195 <expand macro="paired_end_options" />
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
196 </when>
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
197
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
198 </conditional>
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
199
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
200 <!-- Adapter Options -->
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
201 <section name="adapter_options" title="Adapter Options">
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
202 <param name="action" type="select" label="What to do if a match is found">
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
203 <option value="trim" selected="True">Trim: trim adapter and upstream or downstream sequence</option>
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
204 <option value="retain">Retain: the read is trimmed, but the adapter sequence is not removed</option>
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
205 <option value="mask">Mask: mask adapters with 'N' characters instead of trimming them</option>
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
206 <option value="lowercase">Lowercase: convert to lowercase</option>
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
207 <option value="none">None: leave unchanged</option>
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
208 </param>
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
209 <param name="internal" type="select" label="Disallow internal adaptor ocurrences" help="The non-internal 5’ and 3’ adapter types disallow internal occurrences of the adapter sequence. The adapter must always be at one of the ends of the read, but partial occurrences are also ok.">
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
210 <option value="X">Enabled</option>
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
211 <option value="" selected="True">Disabled</option>
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
212 </param>
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
213 <param argument="--error-rate" type="float" min="0" max="1" value="0.1" label="Maximum error rate" help="Maximum allowed error rate (no. of errors divided by the length of the matching region)." />
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
214 <param argument="--no-indels" type="boolean" value="False" truevalue="--no-indels" falsevalue="" label="Do not allow indels (Use ONLY with anchored 5' (front) adapters)." help="Do not allow indels in the alignments. That is, allow only mismatches. This option is currently only supported for anchored 5' adapters ('^ADAPTER') (default: both mismatches and indels are allowed)." />
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
215 <param argument="--times" type="integer" min="1" value="1" label="Match times" help="Try to remove adapters at most COUNT times. Useful when an adapter gets appended multiple times." />
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
216 <param argument="--overlap" type="integer" min="1" value="3" label="Minimum overlap length" help="Minimum overlap length. If the overlap between the adapter and the sequence is shorter than LENGTH, the read is not modified. This reduces the number of bases trimmed purely due to short random adapter matches." />
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
217 <param name="match_read_wildcards" type="select" label="Match wildcards" help="Allow 'N's as matches. Default: in the adapters but not in the reads">
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
218 <option value=" " selected="True">In the adapters but not in the reads</option>
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
219 <option value="--match-read-wildcards">In the adapters and in the reads</option>
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
220 <option value="--no-match-adapter-wildcards">Nowhere</option>
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
221 </param>
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
222 <param argument="--revcomp" type="boolean" value="False" truevalue="--revcomp" falsevalue="" label="Look for adapters in the reverse complement" help="Check both the read and its reverse complement for adapter matches. If match is on reverse-complemented version, output that one. Default: check only read." />
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
223 </section>
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
224
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
225 <!-- Filter Options -->
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
226 <section name="filter_options" title="Filter Options">
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
227 <param argument="--discard-trimmed" type="boolean" value="False" truevalue="--discard-trimmed" falsevalue="" label="Discard Trimmed Reads" help="Discard reads that contain the adapter instead of trimming them. Use the 'Minimum overlap length' option in order to avoid throwing away too many randomly matching reads!" />
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
228 <param argument="--discard_untrimmed" type="boolean" value="False" truevalue="--discard-untrimmed" falsevalue="" label="Discard Untrimmed Reads" help="Discard reads that do not contain the adapter." />
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
229 <param argument="--minimum-length" type="integer" min="0" optional="True" value="25" label="Minimum length (R1)" help="Discard trimmed reads that are shorter than LENGTH. Reads that are too short even before adapter removal are also discarded." />
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
230 <param argument="--maximum-length" type="integer" min="0" optional="True" value="" label="Maximum length (R1)" help="Discard trimmed reads that are longer than LENGTH. Reads that are too long even before adapter removal are also discarded." />
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
231 <conditional name="length_R2_options">
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
232 <param name="length_R2_status" type="select" label="Specify a minimum/maximum length for reverse reads (R2)" help="When trimming paired-end reads, the minimum/maximum lengths for R1 and R2 can be specified separately. If not provided, the same minimum length applies to both reads.">
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
233 <option value="True">Enabled</option>
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
234 <option value="False" selected="True">Disabled</option>
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
235 </param>
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
236 <when value="True">
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
237 <param name="R2_minimum" type="integer" min="0" value="" optional="True" label="Minimum length (R2)" />
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
238 <param name="R2_maximum" type="integer" min="0" value="" optional="True" label="Maximum length (R2)" />
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
239 </when>
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
240 <when value="False">
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
241 </when>
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
242 </conditional>
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
243 <param argument="--max-n" type="float" min="0" optional="True" label="Max N" help="Discard reads with more than this number of 'N' bases. A number between 0 and 1 is interpreted as a fraction of the read length." />
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
244 <param argument="--pair-filter" type="select" optional="True" label="Pair filter" help="Which of the reads in a paired-end read have to match the filtering criterion in order for the pair to be filtered. Default: any">
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
245 <option value="any" selected="True">Any: a read pair is discarded (or redirected) if one of the reads (R1 or R2) fulfills the filtering criterion. </option>
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
246 <option value="both">Both: filtering criteria must apply to both reads in order for a read pair to be discarded. </option>
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
247 <option value="first">First: will make a decision about the read pair by inspecting whether the filtering criterion applies to the first read, ignoring the second read.</option>
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
248
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
249 </param>
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
250 <param argument="--max-expected-errors" type="integer" min="0" optional="True" value="" label="Max expected errors" help="Discard reads whose expected number of errors (computed from quality values) exceeds this value." />
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
251 <param argument="--discard-cassava" type="boolean" truevalue="--discard-cassava" falsevalue="" checked="False" label="Discard CASAVA filtering" help="Discard reads that did not pass CASAVA filtering (header has :Y:)." />
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
252 </section>
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
253
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
254 <!-- Read Modification Options -->
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
255 <section name="read_mod_options" title="Read Modification Options">
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
256 <param argument="--quality-cutoff" type="text" value="0" label="Quality cutoff" help=" Trim low-quality bases from 5' and/or 3' ends of each read before adapter removal. Applied to both reads for paired-end data, unless a separate value for the second read is specified. If one value is given, only the 3' end is trimmed. If two comma-separated cutoffs are given, the 5' end is trimmed with the first cutoff, the 3' end with the second.">
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
257 <sanitizer>
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
258 <valid initial="string.digits"><add value="," /></valid>
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
259 </sanitizer>
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
260 <validator type="regex">[0-9,]+</validator>
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
261 </param>
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
262 <param argument="--nextseq-trim" type="integer" value="0" label="NextSeq trimming" help="Experimental option for quality trimming of NextSeq data. This is necessary because that machine cannot distinguish between G and reaching the end of the fragment (it encodes G as ‘black’). This option works like regular quality trimming (where one would use -q 20 instead), except that the qualities of G bases are ignored." />
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
263 <param argument="--trim-n" type="boolean" truevalue="--trim-n" falsevalue="" checked="False" label="Trim Ns" help="Trim N's on ends of reads." />
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
264 <param argument="--strip-suffix" label="Strip suffix" type="text" help="Remove this suffix from read names if present." />
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
265 <conditional name="shorten_options">
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
266 <param name="shorten_values" type="select" label="Shortening reads to a fixed length" help="If you want to remove a fixed number of bases from each read, use the –cut option instead.">
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
267 <option value="True">Enabled</option>
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
268 <option value="False" selected="True">Disabled</option>
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
269 </param>
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
270 <when value="True">
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
271 <param argument="--length" type="integer" value="0" label="Length" help="Shorten reads to this length. This modification is applied after adapter trimming." />
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
272 <param name="shorten_end" type="select" label="End at which to apply the slice">
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
273 <option value="3prime">3' ends</option>
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
274 <option value="5prime">5' ends</option>
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
275 </param>
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
276 </when>
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
277 <when value="False">
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
278 </when>
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
279 </conditional>
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
280 <param argument="--length-tag" label="Length tag" type="text" optional="True" help="Search for TAG followed by a decimal number in the name of the read (description/comment field of the FASTA or FASTQ file). Replace the decimal number with the correct length of the trimmed read. For example, use --length-tag 'length=' to search for fields like 'length=123'." >
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
281 <sanitizer invalid_char="">
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
282 <valid initial="string.letters,string.digits">
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
283 <add value="/" />
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
284 <add value="+" />
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
285 <add value="-" />
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
286 <add value="=" />
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
287 <add value=" " />
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
288 <add value="_" />
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
289 </valid>
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
290 </sanitizer>
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
291 <validator type="regex">[A-Za-z0-9 =-_/+]+</validator>
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
292 </param>
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
293 <param argument="--rename" label="Rename reads" type="text" optional="True" help="This option can be used to rename both single-end and paired-end reads. ">
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
294 <sanitizer invalid_char="">
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
295 <valid initial="string.letters,string.digits">
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
296 <add value="{" />
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
297 <add value="}" />
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
298 <add value="_" />
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
299 <add value="=" />
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
300 <add value=" " />
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
301 </valid>
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
302 </sanitizer>
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
303 <validator type="regex">[A-Za-z0-9 {}=_]+</validator>
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
304 </param>
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
305 <param argument="--zero-cap" type="boolean" truevalue="--zero-cap" falsevalue="" checked="False" label="Change negative quality values to zero" />
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
306 </section>
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
307
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
308 <!-- Output Options -->
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
309 <param name="output_selector" type="select" multiple="True" display="checkboxes" label="Outputs selector">
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
310 <option value="report">Report: Cutadapt's per-adapter statistics. You can use this file with MultiQC.</option>
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
311 <option value="info_file">Info file: write information about each read and its adapter matches.</option>
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
312 <option value="rest_file">Rest of read: when the adapter matches in the middle of a read, write the rest (after the adapter).</option>
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
313 <option value="wildcard_file">Wildcard file: when the adapter has wildcard bases (Ns) write adapter bases matching wildcard positions.</option>
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
314 <option value="too_short_file">Too short reads: write reads that are too short according to minimum length specified (default: discard reads).</option>
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
315 <option value="too_long_file">Too long reads: write reads that are too long (according to maximum length specified)</option>
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
316 <option value="untrimmed_file">Untrimmed reads: write reads that do not contain the adapter to a separate file, instead of writing them to the regular output file (default: output to same file as trimmed)</option>
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
317 <option value="multiple_output">Multiple output: create a separate file for each adapter trimmed (default: all trimmed reads are in a single file)</option>
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
318 <option value="json_stats">Statistics in JSON format</option>
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
319 </param>
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
320 </inputs>
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
321
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
322 <outputs>
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
323 <data name="out1" format="fastqsanger" metadata_source="input_1" from_work_dir="out1*" label="${tool.name} on ${on_string}: Read 1 Output">
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
324 <filter>library['type'] != 'paired_collection' and 'multiple_output' not in output_selector</filter>
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
325 <expand macro="inherit_format_1" />
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
326 </data>
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
327
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
328 <data name="out2" format="fastqsanger" metadata_source="input_2" from_work_dir="out2*" label="${tool.name} on ${on_string}: Read 2 Output" >
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
329 <filter>library['type'] == 'paired' and 'multiple_output' not in output_selector</filter>
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
330 <expand macro="inherit_format_2" />
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
331 </data>
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
332
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
333 <collection name="out_pairs" type="paired" format_source="input_1" label="${tool.name} on ${on_string}: Reads">
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
334 <filter>library['type'] == 'paired_collection' and 'multiple_output' not in output_selector</filter>
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
335 <data name="forward" from_work_dir="out1.fq*" />
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
336 <data name="reverse" from_work_dir="out2.fq*" />
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
337 </collection>
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
338
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
339 <data name="report" format="txt" from_work_dir="report.txt" label="${tool.name} on ${on_string}: Report">
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
340 <filter>output_selector and 'report' in output_selector</filter>
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
341 </data>
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
342 <data name="info_file" format="txt" metadata_source="input_1" label="${tool.name} on ${on_string}: Info File" >
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
343 <filter>output_selector and 'info_file' in output_selector</filter>
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
344 </data>
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
345
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
346 <data name="rest_output" format="fastqsanger" metadata_source="input_1" from_work_dir="rest_output*" label="${tool.name} on ${on_string}: Rest of Reads (R1 only)" >
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
347 <filter>output_selector and 'rest_file' in output_selector</filter>
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
348 <expand macro="inherit_format_1" />
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
349 </data>
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
350
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
351 <data name="wild_output" format="txt" metadata_source="input_1" from_work_dir="wild_output*" label="${tool.name} on ${on_string}: Wildcard File" >
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
352 <filter>output_selector and 'wildcard_file' in output_selector</filter>
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
353 </data>
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
354
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
355 <data name="untrimmed_output" format="fastqsanger" metadata_source="input_1" from_work_dir="untrimmed_output*" label="${tool.name} on ${on_string}: Untrimmed Read 1" >
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
356 <filter>output_selector and 'untrimmed_file' in output_selector</filter>
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
357 <expand macro="inherit_format_1" />
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
358 </data>
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
359 <data name="untrimmed_paired_output" format="fastqsanger" metadata_source="input_2" from_work_dir="untrimmed_paired_output*" label="${tool.name} on ${on_string}: Untrimmed Read 2" >
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
360 <filter>library['type'] == 'paired' or library['type'] == 'paired_collection'</filter>
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
361 <filter>output_selector and 'untrimmed_file' in output_selector </filter>
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
362 <expand macro="inherit_format_2" />
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
363 </data>
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
364
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
365 <data name="too_short_output" format="fastqsanger" metadata_source="input_1" from_work_dir="too_short_output*" label="${tool.name} on ${on_string}: Too Short Read 1" >
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
366 <filter>output_selector and 'too_short_file' in output_selector</filter>
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
367 <expand macro="inherit_format_1" />
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
368 </data>
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
369 <data name="too_short_paired_output" format="fastqsanger" metadata_source="input_2" from_work_dir="too_short_paired_output*" label="${tool.name} on ${on_string}: Too Short Read 2" >
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
370 <filter>library['type'] == 'paired' or library['type'] == 'paired_collection'</filter>
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
371 <filter>output_selector and 'too_short_file' in output_selector</filter>
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
372 <expand macro="inherit_format_2" />
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
373 </data>
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
374 <data name="too_long_output" format="fastqsanger" metadata_source="input_1" from_work_dir="too_long_output*" label="${tool.name} on ${on_string}: Too Long Read 1" >
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
375 <filter>output_selector and 'too_long_file' in output_selector</filter>
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
376 <expand macro="inherit_format_1" />
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
377 </data>
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
378 <data name="too_long_paired_output" format="fastqsanger" metadata_source="input_2" from_work_dir="too_long_paired_output*" label="${tool.name} on ${on_string}: Too Long Read 2" >
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
379 <filter>library['type'] == 'paired' or library['type'] == 'paired_collection'</filter>
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
380 <filter>output_selector and 'too_long_file' in output_selector</filter>
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
381 <expand macro="inherit_format_2" />
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
382 </data>
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
383 <data name="json_stats" format="json" from_work_dir="stats.json" label="${tool.name} on ${on_string}: Statistics (JSON)" >
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
384 <filter>output_selector and 'json_stats' in output_selector</filter>
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
385 </data>
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
386 <collection name="split_output" type="list" label="${tool.name} on ${on_string}: Split outputs" format="fastqsanger" >
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
387 <discover_datasets pattern="(?P&lt;designation&gt;.+)\.(?P&lt;ext&gt;fastq.*)" directory="split" />
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
388 <filter>output_selector and 'multiple_output' in output_selector</filter>
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
389 </collection>
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
390 </outputs>
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
391
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
392 <tests>
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
393 <!-- Ensure fastq works -->
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
394 <test expect_num_outputs="1">
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
395 <param name="type" value="single" />
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
396 <param name="input_1" ftype="fastq" value="cutadapt_small.fastq" />
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
397 <section name="r1">
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
398 <repeat name="adapters">
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
399 <conditional name="adapter_source">
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
400 <param name="adapter_source_list" value="user"/>
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
401 <param name="adapter" value="AGATCGGAAGAGC"/>
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
402 </conditional>
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
403 </repeat>
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
404 </section>
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
405 <output name="out1" file="cutadapt_small.out" ftype="fastq"/>
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
406 </test>
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
407 <!-- Ensure single end fastq.gz works -->
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
408 <test expect_num_outputs="1">
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
409 <param name="type" value="single" />
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
410 <param name="input_1" ftype="fastq.gz" value="bwa-mem-fastq1.fq.gz" />
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
411 <section name="r1">
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
412 <repeat name="adapters">
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
413 <conditional name="adapter_source">
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
414 <param name="adapter_source_list" value="user"/>
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
415 <param name="adapter" value="AGATCGGAAGAGC"/>
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
416 </conditional>
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
417 </repeat>
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
418 </section>
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
419 <output name="out1" decompress="True" file="cutadapt_out1.fq.gz" ftype="fastq.gz"/>
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
420 </test>
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
421 </tests>
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
422
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
423 <help><![CDATA[
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
424
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
425 .. class:: infomark
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
426
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
427 **What it does**
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
428
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
429 -------------------
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
430
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
431 **Cutadapt** finds and removes adapter sequences, primers, poly-A tails and other types of unwanted sequence from your high-throughput sequencing reads.
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
432
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
433 Cleaning your data in this way is often required: Reads from small-RNA sequencing contain the 3’ sequencing adapter because the read is longer than the molecule that is sequenced, such as in microRNA, or CRISPR data, or Poly-A tails that are useful for pulling out RNA from your sample but often you don’t want them to be in your reads.
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
434
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
435 Cutadapt_ helps with these trimming tasks by finding the adapter or primer sequences in an error-tolerant way. It can also modify and filter reads in various ways. Cutadapt searches for the adapter in all reads and removes it when it finds it. Unless you use a filtering option, all reads that were present in the input file will also be present in the output file, some of them trimmed, some of them not. Even reads that were trimmed entirely (because the adapter was found in the very beginning) are output. All of this can be changed with options in the tool form above.
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
436
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
437 The tool is based on the **Open Source** Cutadapt_ tool. See the complete `Cutadapt documentation`_ for additional details. If you use Cutadapt, please cite *Marcel, 2011* under **Citations** below.
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
438
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
439 -------------------
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
440
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
441 **Inputs**
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
442
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
443 -------------------
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
444
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
445 Input files for Cutadapt need to be:
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
446
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
447 - FASTQ.GZ, FASTQ.BZ2, FASTQ or FASTA
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
448
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
449 To trim an adapter, input the ADAPTER sequence in plain text or in a FASTA file e.g. AACCGGTT (with the characters: **$**, **^**, **...**, if anchored or linked).
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
450
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
451 ============================================= ===================
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
452 **Option** **Sequence**
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
453 --------------------------------------------- -------------------
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
454 3’ (End) Adapter ADAPTER
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
455 Anchored 3’ Adapter ADAPTER$
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
456
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
457 5’ (Front) Adapter ADAPTER
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
458 Anchored 5’ Adapter ^ADAPTER
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
459
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
460 5’ or 3’ (Both possible) ADAPTER
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
461
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
462 Linked Adapter - 3' (End) only ADAPTER1...ADAPTER2
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
463 Non-anchored Linked Adapter - 5' (Front) only ADAPTER1...ADAPTER2
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
464 ============================================= ===================
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
465
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
466 Below is an illustration of the allowed adapter locations relative to the read and depending on the adapter type:
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
467
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
468 .. image:: $PATH_TO_IMAGES/adapters.svg
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
469
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
470
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
471 -------------------
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
472
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
473 *Example: Illumina TruSeq Adapters*
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
474
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
475 -------------------
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
476
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
477 If you have reads containing Illumina TruSeq adapters, for example, follow these steps.
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
478
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
479
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
480 For Single-end reads as well as the first reads of Paired-end data:
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
481
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
482 **Read 1**
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
483
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
484 In the **3' (End) Adapters** option above, insert A + the “TruSeq Indexed Adapter” prefix that is common to all Indexed Adapter sequences, e.g insert:
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
485
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
486 AGATCGGAAGAGCACACGTCTGAACTCCAGTCAC
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
487
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
488
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
489 For the second reads of Paired-end data:
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
490
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
491 **Read 2**
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
492
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
493 In the **3' (End) Adapters** option above, insert the reverse complement of the “TruSeq Universal Adapter”:
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
494
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
495 AGATCGGAAGAGCGTCGTGTAGGGAAAGAGTGTAGATCTCGGTGGTCGCCGTATCATT
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
496
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
497 The adapter sequences can be found in the document `Illumina TruSeq Adapters De-Mystified`_.
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
498
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
499 -----------
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
500
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
501 **Outputs**
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
502
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
503 -----------
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
504
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
505 - Trimmed reads
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
506
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
507 Optionally, under **Output Options** you can choose to output
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
508
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
509 * Report
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
510 * Info file
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
511
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
512
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
513 **Report**
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
514
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
515 Cutadapt can output per-adapter statistics if you select to output the report above.
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
516
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
517 Example:
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
518
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
519 ::
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
520
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
521 This is cutadapt 3.4 with Python 3.9.2
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
522
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
523 Command line parameters: -j=1 -a AGATCGGAAGAGC -A AGATCGGAAGAGC --output=out1.fq.gz --paired-output=out2.fq.gz --error-rate=0.1 --times=1
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
524 --overlap=3 --action=trim --minimum-length=30:40 --pair-filter=both --cut=0 bwa-mem-fastq1_assimetric_fq_gz.fq.gz bwa-mem-fastq2_assimetric_fq_gz.fq.gz
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
525
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
526 Processing reads on 1 core in paired-end mode ...
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
527 Finished in 0.01 s (129 µs/read; 0.46 M reads/minute).
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
528
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
529 === Summary ===
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
530
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
531 Total read pairs processed: 99
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
532 Read 1 with adapter: 2 (2.0%)
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
533 Read 2 with adapter: 4 (4.0%)
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
534 Pairs that were too short: 3 (3.0%)
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
535 Pairs written (passing filters): 96 (97.0%)
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
536
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
537 Total basepairs processed: 48,291 bp
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
538 Read 1: 24,147 bp
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
539 Read 2: 24,144 bp
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
540 Total written (filtered): 48,171 bp (99.8%)
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
541 Read 1: 24,090 bp
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
542 Read 2: 24,081 bp
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
543
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
544
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
545 **Info file**
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
546
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
547 The info file contains information about the found adapters. The output is a tab-separated text file. Each line corresponds to one read of the input file.
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
548
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
549 Columns contain the following data:
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
550
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
551 * **1st**: Read name
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
552 * **2nd**: Number of errors
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
553 * **3rd**: 0-based start coordinate of the adapter match
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
554 * **4th**: 0-based end coordinate of the adapter match
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
555 * **5th**: Sequence of the read to the left of the adapter match (can be empty)
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
556 * **6th**: Sequence of the read that was matched to the adapter
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
557 * **7th**: Sequence of the read to the right of the adapter match (can be empty)
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
558 * **8th**: Name of the found adapter
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
559 * **9th**: Quality values corresponding to sequence left of the adapter match (can be empty)
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
560 * **10th**: Quality values corresponding to sequence matched to the adapter (can be empty)
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
561 * **11th**: Quality values corresponding to sequence to the right of the adapter (can be empty)
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
562
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
563 The concatenation of columns 5-7 yields the full read sequence. Column 8 identifies the found adapter. Adapters without a name are numbered starting from 1. Fields 9-11 are empty if quality values are not available. Concatenating them yields the full sequence of quality values.
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
564
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
565 If no adapter was found, the format is as follows:
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
566
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
567 #. Read name
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
568 #. The value -1
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
569 #. The read sequence
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
570 #. Quality values
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
571
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
572 When parsing the file, be aware that additional columns may be added in the future. Note also that some fields can be empty, resulting in consecutive tabs within a line.
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
573
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
574 If the --times option is used and greater than 1, each read can appear more than once in the info file. There will be one line for each found adapter, all with identical read names. Only for the first of those lines will the concatenation of columns 5-7 be identical to the original read sequence (and accordingly for columns 9-11). For subsequent lines, the shown sequence are the ones that were used in subsequent rounds of adapter trimming, that is, they get successively shorter.
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
575
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
576
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
577 --------------------
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
578
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
579 **Rename Reads**
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
580
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
581 --------------------
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
582
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
583
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
584 The --rename option expects a template string such as {id} extra_info {adapter_name} as a parameter. It can contain regular text and placeholders that consist of a name enclosed in curly braces ({placeholdername}).
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
585
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
586 The read name will be set to the template string in which the placeholders are replaced with the actual values relevant for the current read.
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
587
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
588 The following placeholders are currently available for single-end reads:
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
589
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
590 * {header} – the full, unchanged header
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
591 * {id} – the read ID, that is, the part of the header before the first whitespace
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
592 * {comment} – the part of the header after the whitespace following the ID
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
593 * {adapter_name} – the name of adapter that was found in this read or no_adapter if there was none adapter match. If you use --times to do multiple rounds of adapter matching, this is the name of the last found adapter.
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
594 * {match_sequence} – the sequence of the read that matched the adapter (including errors). If there was no adapter match, this is set to an empty string. If you use a linked adapter, this is to the two matching strings, separated by a comma.
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
595 * {cut_prefix} – the prefix removed by the --cut (or -u) option (that is, when used with a positive length argument)
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
596 * {cut_suffix} – the suffix removed by the --cut (or -u) option (that is, when used with a negative length argument)
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
597 * {rc} – this is replaced with the string rc if the read was reverse complemented. This only applies when reverse complementing was requested
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
598
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
599 If the --rename option is used with paired-end data, the template is applied separately to both R1 and R2. That is, for R1, the placeholders are replaced with values from R1, and for R2, the placeholders are replaced with values from R2. For example, {comment} becomes R1’s comment in R1 and it becomes R2’s comment in R2.
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
600
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
601 For paired-end data, the placeholder {rn} is available (“read number”), and it is replaced with 1 in R1 and with 2 in R2.
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
602
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
603 In addition, it is possible to write a placeholder as {r1.placeholdername} or {r2.placeholdername}, which always takes the replacement value from R1 or R2, respectively.
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
604 The {r1.placeholder} and {r2.placeholder} notation is available for all placeholders except {rn} and {id} because the read ID needs to be identical for both reads.
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
605
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
606 --------------------
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
607
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
608 **More Information**
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
609
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
610 --------------------
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
611
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
612 See the excellent `Cutadapt documentation`_
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
613
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
614 .. _Cutadapt: https://cutadapt.readthedocs.io/en/stable/
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
615 .. _`Cutadapt documentation`: https://cutadapt.readthedocs.io/en/latest/index.html
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
616 .. _`Illumina TruSeq Adapters De-Mystified`: http://tucf-genomics.tufts.edu/documents/protocols/TUCF_Understanding_Illumina_TruSeq_Adapters.pdf
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
617
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
618
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
619 --------------------
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
620
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
621 **Galaxy Wrapper Development**
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
622
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
623 --------------------
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
624
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
625 Author: Lance Parsons <lparsons@princeton.edu>
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
626
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
627 ]]></help>
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
628 <expand macro="citations" />
b4479aea41df Uploaded
jackcurragh
parents:
diff changeset
629 </tool>