annotate redup.xml @ 0:df1e7c7dd9cb draft default tip

Initial uploaded of files
author jgarbe
date Wed, 27 Nov 2013 14:39:56 -0500
parents
children
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
0
df1e7c7dd9cb Initial uploaded of files
jgarbe
parents:
diff changeset
1 <tool id="redup" name="Redup" version="1.0">
df1e7c7dd9cb Initial uploaded of files
jgarbe
parents:
diff changeset
2 <description>Remove exact duplicate reads from paired-end fastq files</description>
df1e7c7dd9cb Initial uploaded of files
jgarbe
parents:
diff changeset
3 <command interpreter="perl">
df1e7c7dd9cb Initial uploaded of files
jgarbe
parents:
diff changeset
4 ## Need to handle file names, probably should fix redup.pl
df1e7c7dd9cb Initial uploaded of files
jgarbe
parents:
diff changeset
5 redup.pl
df1e7c7dd9cb Initial uploaded of files
jgarbe
parents:
diff changeset
6 #if $opt_n:
df1e7c7dd9cb Initial uploaded of files
jgarbe
parents:
diff changeset
7 -n $opt_n
df1e7c7dd9cb Initial uploaded of files
jgarbe
parents:
diff changeset
8 #end if
df1e7c7dd9cb Initial uploaded of files
jgarbe
parents:
diff changeset
9 $fastq1_in $fastq2_in $unique1_out $unique2_out
df1e7c7dd9cb Initial uploaded of files
jgarbe
parents:
diff changeset
10 #if $opt_n:
df1e7c7dd9cb Initial uploaded of files
jgarbe
parents:
diff changeset
11 > $duplicates
df1e7c7dd9cb Initial uploaded of files
jgarbe
parents:
diff changeset
12 #end if
df1e7c7dd9cb Initial uploaded of files
jgarbe
parents:
diff changeset
13 </command>
df1e7c7dd9cb Initial uploaded of files
jgarbe
parents:
diff changeset
14 <inputs>
df1e7c7dd9cb Initial uploaded of files
jgarbe
parents:
diff changeset
15 <param name="fastq1_in" type="data" format="fastq" label="Fastq Input 1"/>
df1e7c7dd9cb Initial uploaded of files
jgarbe
parents:
diff changeset
16 <param name="fastq2_in" type="data" format="fastq" label="Fastq Input 2"/>
df1e7c7dd9cb Initial uploaded of files
jgarbe
parents:
diff changeset
17 <param name="opt_n" type="integer" value="20" optional="true" label="Number of most duplicated sequences printed out. (default 20)">
df1e7c7dd9cb Initial uploaded of files
jgarbe
parents:
diff changeset
18 <validator type="in_range" message="Value can not be negative" min="0"/>
df1e7c7dd9cb Initial uploaded of files
jgarbe
parents:
diff changeset
19 </param>
df1e7c7dd9cb Initial uploaded of files
jgarbe
parents:
diff changeset
20 </inputs>
df1e7c7dd9cb Initial uploaded of files
jgarbe
parents:
diff changeset
21 <stdio>
df1e7c7dd9cb Initial uploaded of files
jgarbe
parents:
diff changeset
22 <exit_code range="1:" level="fatal"/>
df1e7c7dd9cb Initial uploaded of files
jgarbe
parents:
diff changeset
23 </stdio>
df1e7c7dd9cb Initial uploaded of files
jgarbe
parents:
diff changeset
24 <outputs>
df1e7c7dd9cb Initial uploaded of files
jgarbe
parents:
diff changeset
25 <data format_source="fastq1_in" name="unique1_out" label="${tool.name} on ${on_string}: fastq1.unique" />
df1e7c7dd9cb Initial uploaded of files
jgarbe
parents:
diff changeset
26 <data format_source="fastq2_in" name="unique2_out" label="${tool.name} on ${on_string}: fastq2.unique" />
df1e7c7dd9cb Initial uploaded of files
jgarbe
parents:
diff changeset
27 <data format="fasta" name="duplicates" label="${tool.name} on ${on_string}: top duplicates" >
df1e7c7dd9cb Initial uploaded of files
jgarbe
parents:
diff changeset
28 <filter>opt_n != None</filter>
df1e7c7dd9cb Initial uploaded of files
jgarbe
parents:
diff changeset
29 </data>
df1e7c7dd9cb Initial uploaded of files
jgarbe
parents:
diff changeset
30 </outputs>
df1e7c7dd9cb Initial uploaded of files
jgarbe
parents:
diff changeset
31 <tests>
df1e7c7dd9cb Initial uploaded of files
jgarbe
parents:
diff changeset
32 <test>
df1e7c7dd9cb Initial uploaded of files
jgarbe
parents:
diff changeset
33 <param name="fastq1_in" ftype="fastq" value="input1.fastq" />
df1e7c7dd9cb Initial uploaded of files
jgarbe
parents:
diff changeset
34 <param name="fastq2_in" ftype="fastq" value="input2.fastq" />
df1e7c7dd9cb Initial uploaded of files
jgarbe
parents:
diff changeset
35 <param name="opt_n" value="20" />
df1e7c7dd9cb Initial uploaded of files
jgarbe
parents:
diff changeset
36 <output name="unique1_out" file="output1.fastq" />
df1e7c7dd9cb Initial uploaded of files
jgarbe
parents:
diff changeset
37 <output name="unique2_out" file="output2.fastq" />
df1e7c7dd9cb Initial uploaded of files
jgarbe
parents:
diff changeset
38 <output name="duplicates" file="duplicates.fasta" />
df1e7c7dd9cb Initial uploaded of files
jgarbe
parents:
diff changeset
39 </test>
df1e7c7dd9cb Initial uploaded of files
jgarbe
parents:
diff changeset
40 </tests>
df1e7c7dd9cb Initial uploaded of files
jgarbe
parents:
diff changeset
41
df1e7c7dd9cb Initial uploaded of files
jgarbe
parents:
diff changeset
42 <help>
df1e7c7dd9cb Initial uploaded of files
jgarbe
parents:
diff changeset
43 This script removes duplicate paired-end reads from the input files sample1_R1.fastq and sample1_R2.fastq and prints out unique reads to the files sample1_R1.fastq.unique and sample2_R2.fastq.unique. Reads must have the exact same sequence to be called duplicates, quality scores are ignored. The top N (default 20) most duplicated sequences are printed out in fasta format, making it convenient for using BLAST to identify them.
df1e7c7dd9cb Initial uploaded of files
jgarbe
parents:
diff changeset
44 </help>
df1e7c7dd9cb Initial uploaded of files
jgarbe
parents:
diff changeset
45 </tool>