annotate copyrighter.xml @ 0:7a7ecf9b9df7 draft

Initial upload
author fangly
date Mon, 29 Jul 2013 06:52:36 -0400
parents
children
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
0
7a7ecf9b9df7 Initial upload
fangly
parents:
diff changeset
1 <tool id="copyrighter" name="CopyRighter" version="0.45">
7a7ecf9b9df7 Initial upload
fangly
parents:
diff changeset
2
7a7ecf9b9df7 Initial upload
fangly
parents:
diff changeset
3 <description>trait bias corrector for microbial profiles</description>
7a7ecf9b9df7 Initial upload
fangly
parents:
diff changeset
4
7a7ecf9b9df7 Initial upload
fangly
parents:
diff changeset
5 <requirements>
7a7ecf9b9df7 Initial upload
fangly
parents:
diff changeset
6 <requirement type="binary">copyrighter</requirement>
7a7ecf9b9df7 Initial upload
fangly
parents:
diff changeset
7 </requirements>
7a7ecf9b9df7 Initial upload
fangly
parents:
diff changeset
8
7a7ecf9b9df7 Initial upload
fangly
parents:
diff changeset
9 <version_string>copyrighter --version</version_string>
7a7ecf9b9df7 Initial upload
fangly
parents:
diff changeset
10
7a7ecf9b9df7 Initial upload
fangly
parents:
diff changeset
11 <command>
7a7ecf9b9df7 Initial upload
fangly
parents:
diff changeset
12 copyrighter
7a7ecf9b9df7 Initial upload
fangly
parents:
diff changeset
13 -i $input
7a7ecf9b9df7 Initial upload
fangly
parents:
diff changeset
14 -d $database.value
7a7ecf9b9df7 Initial upload
fangly
parents:
diff changeset
15 #if str($lookup):
7a7ecf9b9df7 Initial upload
fangly
parents:
diff changeset
16 -l $lookup
7a7ecf9b9df7 Initial upload
fangly
parents:
diff changeset
17 #end if
7a7ecf9b9df7 Initial upload
fangly
parents:
diff changeset
18 #if str($total) != "None":
7a7ecf9b9df7 Initial upload
fangly
parents:
diff changeset
19 -t $total
7a7ecf9b9df7 Initial upload
fangly
parents:
diff changeset
20 #end if
7a7ecf9b9df7 Initial upload
fangly
parents:
diff changeset
21 #if str($verbose):
7a7ecf9b9df7 Initial upload
fangly
parents:
diff changeset
22 -v
7a7ecf9b9df7 Initial upload
fangly
parents:
diff changeset
23 #end if
7a7ecf9b9df7 Initial upload
fangly
parents:
diff changeset
24 </command>
7a7ecf9b9df7 Initial upload
fangly
parents:
diff changeset
25
7a7ecf9b9df7 Initial upload
fangly
parents:
diff changeset
26 <inputs>
7a7ecf9b9df7 Initial upload
fangly
parents:
diff changeset
27 <param name="input" type="data" format="txt" label="Input community file" help="Text file obtained from 16S rRNA microarray, 16S rRNA amplicon sequencing or metagenomic sequencing, in biom, QIIME, GAAS, Unifrac, or generic (tabular site-by-species) format. The file must contain read counts (not percentages) and taxa must have UNALTERED taxonomic assignments." />
7a7ecf9b9df7 Initial upload
fangly
parents:
diff changeset
28 <conditional name="database">
7a7ecf9b9df7 Initial upload
fangly
parents:
diff changeset
29 <param name="specify" type="select" label="Trait database" help="Tab-delimited file of traits: 16S copy number, genome length, ...">
7a7ecf9b9df7 Initial upload
fangly
parents:
diff changeset
30 <option value="builtin">Built-in file</option>
7a7ecf9b9df7 Initial upload
fangly
parents:
diff changeset
31 <option value="uploaded">Uploaded file</option>
7a7ecf9b9df7 Initial upload
fangly
parents:
diff changeset
32 </param>
7a7ecf9b9df7 Initial upload
fangly
parents:
diff changeset
33 <when value="builtin">
7a7ecf9b9df7 Initial upload
fangly
parents:
diff changeset
34 <param name="value" type="select" label="Built-in file">
7a7ecf9b9df7 Initial upload
fangly
parents:
diff changeset
35 <options from_data_table="trait_db" />
7a7ecf9b9df7 Initial upload
fangly
parents:
diff changeset
36 <validator type="no_options" message="No built-in trait database is available"/>
7a7ecf9b9df7 Initial upload
fangly
parents:
diff changeset
37 </param>
7a7ecf9b9df7 Initial upload
fangly
parents:
diff changeset
38 </when>
7a7ecf9b9df7 Initial upload
fangly
parents:
diff changeset
39 <when value="uploaded">
7a7ecf9b9df7 Initial upload
fangly
parents:
diff changeset
40 <param name="value" type="data" format="tabular" label="Uploaded file" />
7a7ecf9b9df7 Initial upload
fangly
parents:
diff changeset
41 </when>
7a7ecf9b9df7 Initial upload
fangly
parents:
diff changeset
42 </conditional>
7a7ecf9b9df7 Initial upload
fangly
parents:
diff changeset
43 <param name="lookup" type="select" display="radio" value="desc" label="Lookup method" help="What to match when looking up the trait value of a taxon.">
7a7ecf9b9df7 Initial upload
fangly
parents:
diff changeset
44 <option value="desc">OTU name</option>
7a7ecf9b9df7 Initial upload
fangly
parents:
diff changeset
45 <option value="id">OTU ID (if recorded in your input community file)</option>
7a7ecf9b9df7 Initial upload
fangly
parents:
diff changeset
46 </param>
7a7ecf9b9df7 Initial upload
fangly
parents:
diff changeset
47 <param name="total" type="data" format="tabular" optional="true" label="Total abundance file" help="Tab-delimited file containing the total microbial abundance of each community, e.g. 16S rRNA quantitative PCR numbers to be corrected by the average 16S rRNA copy number." />
7a7ecf9b9df7 Initial upload
fangly
parents:
diff changeset
48 <param name="verbose" type="boolean" checked="no" truevalue="1" falsevalue="0" format="txt" label="Verbose" help="Display trait value assignments." />
7a7ecf9b9df7 Initial upload
fangly
parents:
diff changeset
49 </inputs>
7a7ecf9b9df7 Initial upload
fangly
parents:
diff changeset
50
7a7ecf9b9df7 Initial upload
fangly
parents:
diff changeset
51 <outputs>
7a7ecf9b9df7 Initial upload
fangly
parents:
diff changeset
52 <data format="txt" name="relative" from_work_dir="out_copyrighted.txt" label="${tool.name} from ${on_string} (relative)"/>
7a7ecf9b9df7 Initial upload
fangly
parents:
diff changeset
53 <data format="tabular" name="absolute" from_work_dir="out_copyrighted_total.tsv" label="${tool.name} from ${on_string} (absolute)">
7a7ecf9b9df7 Initial upload
fangly
parents:
diff changeset
54 <filter>str(total) != "None"</filter>
7a7ecf9b9df7 Initial upload
fangly
parents:
diff changeset
55 </data>
7a7ecf9b9df7 Initial upload
fangly
parents:
diff changeset
56 <data format="txt" name="combined" from_work_dir="out_copyrighted_combined.txt" label="${tool.name} from ${on_string} (combined)">
7a7ecf9b9df7 Initial upload
fangly
parents:
diff changeset
57 <filter>str(total) != "None"</filter>
7a7ecf9b9df7 Initial upload
fangly
parents:
diff changeset
58 </data>
7a7ecf9b9df7 Initial upload
fangly
parents:
diff changeset
59 </outputs>
7a7ecf9b9df7 Initial upload
fangly
parents:
diff changeset
60
7a7ecf9b9df7 Initial upload
fangly
parents:
diff changeset
61 <stdio>
7a7ecf9b9df7 Initial upload
fangly
parents:
diff changeset
62 <exit_code range="1:" level="fatal" />
7a7ecf9b9df7 Initial upload
fangly
parents:
diff changeset
63 <regex match="error|exception|invalid" source="stderr" level="fatal" />
7a7ecf9b9df7 Initial upload
fangly
parents:
diff changeset
64 </stdio>
7a7ecf9b9df7 Initial upload
fangly
parents:
diff changeset
65
7a7ecf9b9df7 Initial upload
fangly
parents:
diff changeset
66 <tests>
7a7ecf9b9df7 Initial upload
fangly
parents:
diff changeset
67 <test>
7a7ecf9b9df7 Initial upload
fangly
parents:
diff changeset
68 <param name="input" value="test_data/in.qiime" />
7a7ecf9b9df7 Initial upload
fangly
parents:
diff changeset
69 <param name="specify" value="uploaded"/>
7a7ecf9b9df7 Initial upload
fangly
parents:
diff changeset
70 <param name="value" value="test_data/in_db.tsv"/>
7a7ecf9b9df7 Initial upload
fangly
parents:
diff changeset
71 <output name="relative" file="test_data/out.qiime"/>
7a7ecf9b9df7 Initial upload
fangly
parents:
diff changeset
72 </test>
7a7ecf9b9df7 Initial upload
fangly
parents:
diff changeset
73 <test>
7a7ecf9b9df7 Initial upload
fangly
parents:
diff changeset
74 <param name="input" value="test_data/in.biom"/>
7a7ecf9b9df7 Initial upload
fangly
parents:
diff changeset
75 <param name="specify" value="uploaded"/>
7a7ecf9b9df7 Initial upload
fangly
parents:
diff changeset
76 <param name="value" value="test_data/in_db.tsv"/>
7a7ecf9b9df7 Initial upload
fangly
parents:
diff changeset
77 <output name="relative" file="test_data/out.biom" lines_diff="2"/>
7a7ecf9b9df7 Initial upload
fangly
parents:
diff changeset
78 </test>
7a7ecf9b9df7 Initial upload
fangly
parents:
diff changeset
79 <test>
7a7ecf9b9df7 Initial upload
fangly
parents:
diff changeset
80 <param name="input" value="test_data/in.qiime"/>
7a7ecf9b9df7 Initial upload
fangly
parents:
diff changeset
81 <param name="specify" value="uploaded"/>
7a7ecf9b9df7 Initial upload
fangly
parents:
diff changeset
82 <param name="value" value="test_data/in_db.tsv"/>
7a7ecf9b9df7 Initial upload
fangly
parents:
diff changeset
83 <param name="verbose" value="yes"/>
7a7ecf9b9df7 Initial upload
fangly
parents:
diff changeset
84 <output name="relative" file="test_data/out.qiime"/>
7a7ecf9b9df7 Initial upload
fangly
parents:
diff changeset
85 </test>
7a7ecf9b9df7 Initial upload
fangly
parents:
diff changeset
86 <test>
7a7ecf9b9df7 Initial upload
fangly
parents:
diff changeset
87 <param name="input" value="test_data/in.biom"/>
7a7ecf9b9df7 Initial upload
fangly
parents:
diff changeset
88 <param name="specify" value="uploaded"/>
7a7ecf9b9df7 Initial upload
fangly
parents:
diff changeset
89 <param name="value" value="test_data/in_db.tsv"/>
7a7ecf9b9df7 Initial upload
fangly
parents:
diff changeset
90 <param name="lookup" value="id"/>
7a7ecf9b9df7 Initial upload
fangly
parents:
diff changeset
91 <output name="relative" file="test_data/out2.biom" lines_diff="2"/>
7a7ecf9b9df7 Initial upload
fangly
parents:
diff changeset
92 </test>
7a7ecf9b9df7 Initial upload
fangly
parents:
diff changeset
93 <test>
7a7ecf9b9df7 Initial upload
fangly
parents:
diff changeset
94 <param name="input" value="test_data/in.qiime"/>
7a7ecf9b9df7 Initial upload
fangly
parents:
diff changeset
95 <param name="specify" value="uploaded"/>
7a7ecf9b9df7 Initial upload
fangly
parents:
diff changeset
96 <param name="value" value="test_data/in_db.tsv"/>
7a7ecf9b9df7 Initial upload
fangly
parents:
diff changeset
97 <param name="total" value="test_data/in_total.tsv"/>
7a7ecf9b9df7 Initial upload
fangly
parents:
diff changeset
98 <output name="relative" file="test_data/out.qiime"/>
7a7ecf9b9df7 Initial upload
fangly
parents:
diff changeset
99 <output name="absolute" file="test_data/out_total.tsv"/>
7a7ecf9b9df7 Initial upload
fangly
parents:
diff changeset
100 <output name="combined" file="test_data/out_combined.qiime"/>
7a7ecf9b9df7 Initial upload
fangly
parents:
diff changeset
101 </test>
7a7ecf9b9df7 Initial upload
fangly
parents:
diff changeset
102 <!--<test>
7a7ecf9b9df7 Initial upload
fangly
parents:
diff changeset
103 <param name="input" value="test_data/in.biom"/>
7a7ecf9b9df7 Initial upload
fangly
parents:
diff changeset
104 <param name="specify" value="builtin"/>
7a7ecf9b9df7 Initial upload
fangly
parents:
diff changeset
105 <param name="value" value="test_data/in_db.tsv"/>
7a7ecf9b9df7 Initial upload
fangly
parents:
diff changeset
106 <output name="relative" file="test_data/out.biom" lines_diff="2"/>
7a7ecf9b9df7 Initial upload
fangly
parents:
diff changeset
107 </test>-->
7a7ecf9b9df7 Initial upload
fangly
parents:
diff changeset
108 </tests>
7a7ecf9b9df7 Initial upload
fangly
parents:
diff changeset
109
7a7ecf9b9df7 Initial upload
fangly
parents:
diff changeset
110 <help>
7a7ecf9b9df7 Initial upload
fangly
parents:
diff changeset
111 **What CopyRighter does**
7a7ecf9b9df7 Initial upload
fangly
parents:
diff changeset
112
7a7ecf9b9df7 Initial upload
fangly
parents:
diff changeset
113 The genome of Bacteria and Archaea often contains several copies of the
7a7ecf9b9df7 Initial upload
fangly
parents:
diff changeset
114 16S rRNA gene. This can lead to significant biases when estimating the
7a7ecf9b9df7 Initial upload
fangly
parents:
diff changeset
115 composition of microbial communities using 16S rRNA amplicons or
7a7ecf9b9df7 Initial upload
fangly
parents:
diff changeset
116 microarrays or their total abundance using 16S rRNA quantitative PCR,
7a7ecf9b9df7 Initial upload
fangly
parents:
diff changeset
117 since species with a large number of copies will contribute
7a7ecf9b9df7 Initial upload
fangly
parents:
diff changeset
118 disproportionally more 16S amplicons than species with a unique copy.
7a7ecf9b9df7 Initial upload
fangly
parents:
diff changeset
119 Fortunately, it is possible to infer the copy number of unsequenced
7a7ecf9b9df7 Initial upload
fangly
parents:
diff changeset
120 microbial species, based on that of close relatives that have been fully
7a7ecf9b9df7 Initial upload
fangly
parents:
diff changeset
121 sequenced. Using this information, CopyRigher corrects microbial
7a7ecf9b9df7 Initial upload
fangly
parents:
diff changeset
122 relative abundance by applying a weight proportional to the inverse of
7a7ecf9b9df7 Initial upload
fangly
parents:
diff changeset
123 the estimated copy number to each species.
7a7ecf9b9df7 Initial upload
fangly
parents:
diff changeset
124
7a7ecf9b9df7 Initial upload
fangly
parents:
diff changeset
125 In metagenomic surveys, a similar problem arises due to genome length
7a7ecf9b9df7 Initial upload
fangly
parents:
diff changeset
126 variations between species, and can be corrected by CopyRighter as well.
7a7ecf9b9df7 Initial upload
fangly
parents:
diff changeset
127
7a7ecf9b9df7 Initial upload
fangly
parents:
diff changeset
128 In all cases, a community file is used as input and a corrected community
7a7ecf9b9df7 Initial upload
fangly
parents:
diff changeset
129 file with trait-corrected (16S rRNA gene copy number or genome length)
7a7ecf9b9df7 Initial upload
fangly
parents:
diff changeset
130 relative abundances is generated. Total abundance can optionally be
7a7ecf9b9df7 Initial upload
fangly
parents:
diff changeset
131 provided, corrected and combined with relative abundance estimates to
7a7ecf9b9df7 Initial upload
fangly
parents:
diff changeset
132 get the absolute abundance of each species. Also the average trait value
7a7ecf9b9df7 Initial upload
fangly
parents:
diff changeset
133 in each community is reported on standard output.
7a7ecf9b9df7 Initial upload
fangly
parents:
diff changeset
134 </help>
7a7ecf9b9df7 Initial upload
fangly
parents:
diff changeset
135
7a7ecf9b9df7 Initial upload
fangly
parents:
diff changeset
136 </tool>
7a7ecf9b9df7 Initial upload
fangly
parents:
diff changeset
137