comparison kodoja_search.xml @ 0:18fe33eb7775 draft

Uploaded kodoja_search.py v0.0.3 wrapper. https://github.com/abaizan/kodoja_galaxy/commit/55004d41a9c0750b2543f394594ee58cc4426609
author peterjc
date Wed, 14 Mar 2018 12:46:57 -0400
parents
children 4554fcd4ef6d
comparison
equal deleted inserted replaced
-1:000000000000 0:18fe33eb7775
1 <tool id="kodoja_search" name="Kodoja database search" version="0.0.0">
2 <description>identify viruses from plant RNA sequencing data</description>
3 <requirements>
4 <requirement type="package" version="0.0.3">kodoja</requirement>
5 </requirements>
6 <version_command>kodoja_search.py --version</version_command>
7 <command detect_errors="exit_code"><![CDATA[
8 kodoja_search.py
9
10 --kraken_db '${kraken_db.fields.path}'
11 --kaiju_db '${kaiju_db.fields.path}'
12
13 #if $single_paired.single_paired_selector == 'yes'
14 #if $forward_input.is_of_type( 'fastq' ):
15 --data_format fastq
16 #else:
17 --data_format fasta
18 #end if
19 --read1 '${single_paired.forward_input}'
20 --read2 '${single_paired.reverse_input}'
21 #else:
22 #if $single_paired.input_sequences.is_of_type('fastq')
23 --data_format fastq
24 #else:
25 --data_format fasta
26 #end if
27 --read1 '${single_paired.input_sequences}'
28 #end if
29
30 ## TODO:
31 ## -m min_trim
32 ## -a trim_adapt
33 ## -q kraken_quick
34 ## -p kraken_preload
35 ## -c kaiju_score
36 ## -l kaiju_minlen
37 ## -i kaiju_mismatch
38
39 ## We'll capture predictably named output files from here:
40 -o .
41 &&
42 mv ./virus_table.txt '$combined_table'
43 ]]></command>
44 <inputs>
45 <param label="Select a Kraken database" name="kraken_db" type="select">
46 <options from_data_table="kraken_databases">
47 <validator message="No Kraken database is available" type="no_options" />
48 </options>
49 </param>
50 <param label="Select a Kaiju database" name="kaiju_db" type="select">
51 <options from_data_table="kaiju_databases">
52 <validator message="No Kaiju database is available" type="no_options" />
53 </options>
54 </param>
55 <conditional name="single_paired">
56 <param name="single_paired_selector" type="select" label="Single or paired reads" help="--paired">
57 <!-- TODO?
58 <option value="collection">Collection</option>
59 -->
60 <option value="yes">Paired</option>
61 <option selected="True" value="no">Single</option>
62 </param>
63 <when value="yes">
64 <param format="fasta,fastq" name="forward_input" type="data" label="Forward strand" help="FASTA or FASTQ dataset"/>
65 <param format="fasta,fastq" name="reverse_input" type="data" label="Reverse strand" help="FASTA or FASTQ dataset"/>
66 </when>
67 <when value="no">
68 <param format="fasta,fastq" label="Input sequences" name="input_sequences" type="data" help="FASTA or FASTQ datasets"/>
69 </when>
70 </conditional>
71 </inputs>
72 <outputs>
73 <data name="combined_table" format="tabular" label="Kodoja species report for ${on_string}" />
74 </outputs>
75 <tests>
76 <test>
77 <param name="kraken_db" value="kraken3viruses" />
78 <param name="kaiju_db" value="kaiju3viruses" />
79 <param name="single_paired_selector" value="no" />
80 <param name="input_sequences" value="testData_1.fastq" ftype="fastq" />
81 <output name="combined_table" file="virus_table_SE_fastq.tabular" ftype="tabular" />
82 </test>
83 <test>
84 <param name="kraken_db" value="kraken3viruses" />
85 <param name="kaiju_db" value="kaiju3viruses" />
86 <param name="single_paired_selector" value="yes" />
87 <param name="forward_input" value="testData_1.fastq" ftype="fastq" />
88 <param name="reverse_input" value="testData_2.fastq" ftype="fastq" />
89 <output name="combined_table" file="virus_table_PE_fastq.tabular" ftype="tabular" />
90 </test>
91 <test>
92 <param name="kraken_db" value="kraken3viruses" />
93 <param name="kaiju_db" value="kaiju3viruses" />
94 <param name="single_paired_selector" value="yes" />
95 <param name="forward_input" value="testData_1.fasta" ftype="fasta" />
96 <param name="reverse_input" value="testData_2.fasta" ftype="fasta" />
97 <output name="combined_table" file="virus_table_PE_fasta.tabular" ftype="tabular" />
98 </test>
99 </tests>
100 <help><![CDATA[
101 Kodoja is a tool intended to identify viral sequences in a
102 FASTQ/FASTA sequencing run by matching them against both
103 Kraken and Kaiju databases.
104
105 The main output is a five column tab-separated table as follows
106 (tabular format in Galaxy):
107
108 1. Species name
109 2. Species NCBI taxonomy identifier (TaxID)
110 3. Number of reads assigned by *either* Kraken or Kaiju to this species
111 4. Number of Reads assigned by *both* Kraken and Kaiju to this species
112 5. Genus name
113 6. Number of reads assigned by *either* Kraken or Kaiju to this genus
114 7. Number of reads assigned by *both* Kraken and Kaiju to this genus
115
116 For example,
117
118 ================================== ============= ================= ============================= ========== =============== ===========================
119 Species Species TaxID Species sequences Species sequences (stringent) Genus Genus sequences Genus sequences (stringent)
120 ---------------------------------- ------------- ----------------- ----------------------------- ---------- --------------- ---------------------------
121 Cassava brown streak virus 137758 45 45 Ipomovirus
122 Ugandan cassava brown streak virus 946046 28 28 Ipomovirus
123 Tobacco etch virus 12227 21 19 Potyvirus
124 ================================== ============= ================= ============================= ========== =============== ===========================
125
126 This is the command line tool's help::
127
128 usage: kodoja_search.py [-h] [--version] -o OUTPUT_DIR -d1 KRAKEN_DB -d2
129 KAIJU_DB -r1 READ1 [-r2 READ2] [-f DATA_FORMAT]
130 [-t THREADS] [-s] [-m TRIM_MINLEN] [-a TRIM_ADAPT]
131 [-q KRAKEN_QUICK] [-p] [-c KAIJU_SCORE]
132 [-l KAIJU_MINLEN] [-i KAIJU_MISMATCH]
133
134 Kodoja
135
136 optional arguments:
137 -h, --help show this help message and exit
138 --version show program's version number and exit
139 -o OUTPUT_DIR, --output_dir OUTPUT_DIR
140 Output directory path, required
141 -d1 KRAKEN_DB, --kraken_db KRAKEN_DB
142 Kraken database path, required
143 -d2 KAIJU_DB, --kaiju_db KAIJU_DB
144 Kaiju database path, required
145 -r1 READ1, --read1 READ1
146 Read 1 file path, required
147 -r2 READ2, --read2 READ2
148 Read 2 file path
149 -f DATA_FORMAT, --data_format DATA_FORMAT
150 Sequence data format
151 -t THREADS, --threads THREADS
152 Number of threads
153 -s, --host_subset Subset host sequences before Kaiju
154 -m TRIM_MINLEN, --trim_minlen TRIM_MINLEN
155 Trimmomatic minimum length
156 -a TRIM_ADAPT, --trim_adapt TRIM_ADAPT
157 Illumina adapter sequence file
158 -q KRAKEN_QUICK, --kraken_quick KRAKEN_QUICK
159 Number of minium hits by Kraken
160 -p, --kraken_preload Kraken preload database
161 -c KAIJU_SCORE, --kaiju_score KAIJU_SCORE
162 Kaju alignment score
163 -l KAIJU_MINLEN, --kaiju_minlen KAIJU_MINLEN
164 Kaju minimum length
165 -i KAIJU_MISMATCH, --kaiju_mismatch KAIJU_MISMATCH
166 Kaju allowed mismatches
167
168 ]]></help>
169 <citations>
170 <citation type="bibtex">
171 @misc{githubkodoja,
172 author = {Baizan Edge, Amanda},
173 year = {2018},
174 title = {Kodoja},
175 publisher = {GitHub},
176 journal = {GitHub repository},
177 url = {https://github.com/abaizan/kodoja},
178 }</citation>
179 </citations>
180 </tool>