Mercurial > repos > nml > refseq_masher
annotate contains.xml @ 1:2c1cb37a3ffe draft
planemo upload for repository https://github.com/phac-nml/refseq_masher commit e83730c5df84a960af58ff09db7eb09d11df2398
author | nml |
---|---|
date | Wed, 08 May 2019 09:15:56 -0400 |
parents | 26df66c32861 |
children | 1ec42f033bb4 |
rev | line source |
---|---|
1
2c1cb37a3ffe
planemo upload for repository https://github.com/phac-nml/refseq_masher commit e83730c5df84a960af58ff09db7eb09d11df2398
nml
parents:
0
diff
changeset
|
1 <tool id="refseq_masher_contains" name="RefSeq Masher Contains" version="0.1.2"> |
0
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
2 <description> |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
3 Find NCBI RefSeq Genomes contained in your sequences |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
4 </description> |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
5 <requirements> |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
6 <requirement type="package" version="0.1.1">refseq_masher</requirement> |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
7 </requirements> |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
8 <command detect_errors="exit_code"> |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
9 <![CDATA[ |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
10 |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
11 #import re |
1
2c1cb37a3ffe
planemo upload for repository https://github.com/phac-nml/refseq_masher commit e83730c5df84a960af58ff09db7eb09d11df2398
nml
parents:
0
diff
changeset
|
12 #import os |
0
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
13 |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
14 #if $input.type == 'fasta' |
1
2c1cb37a3ffe
planemo upload for repository https://github.com/phac-nml/refseq_masher commit e83730c5df84a960af58ff09db7eb09d11df2398
nml
parents:
0
diff
changeset
|
15 #set $input_files = '"{}.fasta"'.format(os.path.splitext($input.fasta.name)[0]) |
0
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
16 ln -s "$input.fasta" $input_files && |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
17 #elif $input.type == 'paired' |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
18 #set $_forward_ext = '.fastq.gz' if $re.match(r'.*\.gz$', $input.forward.name) else '.fastq' |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
19 #set $_forward = '"{}_1{}"'.format($re.sub(r'_[12]\..+$', '', $input.forward.name), $_forward_ext) |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
20 #set $_reverse_ext = '.fastq.gz' if $re.match(r'.*\.gz$', $input.reverse.name) else '.fastq' |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
21 #set $_reverse = '"{}_2{}"'.format($re.sub(r'_[12]\..+$', '', $input.reverse.name), $_reverse_ext) |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
22 #set $input_files = '{} {}'.format($_forward, $_reverse) |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
23 ln -s "$input.forward" $_forward && |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
24 ln -s "$input.reverse" $_reverse && |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
25 #elif $input.type == 'single' |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
26 #set $input_files = '"{}"'.format($input.single.name) |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
27 ln -s "$input.single" $input_files && |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
28 #elif $input.type == 'paired_collection' |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
29 #set $_forward_ext = '.fastq.gz' if $re.match(r'.*\.gz$', str($input.paired_collection.forward)) else '.fastq' |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
30 #set $_forward = '"{}_1{}"'.format($input.paired_collection.name, $_forward_ext) |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
31 #set $_reverse_ext = '.fastq.gz' if $re.match(r'.*\.gz$', str($input.paired_collection.reverse)) else '.fastq' |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
32 #set $_reverse = '"{}_2{}"'.format($input.paired_collection.name, $_reverse_ext) |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
33 #set $input_files = '{} {}'.format($_forward, $_reverse) |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
34 ln -s "$input.paired_collection.forward" $_forward && |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
35 ln -s "$input.paired_collection.reverse" $_reverse && |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
36 #end if |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
37 |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
38 refseq_masher |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
39 $adv.verbosity |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
40 contains |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
41 --output refseq_masher-contains.${adv.output_type} |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
42 --output-type $adv.output_type |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
43 --top-n-results $adv.top_n_results |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
44 --parallelism "\${GALAXY_SLOTS:-1}" |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
45 --min-identity $adv.min_identity |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
46 --max-pvalue $adv.max_pvalue |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
47 $input_files |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
48 |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
49 ]]> |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
50 </command> |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
51 <inputs> |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
52 <conditional name="input"> |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
53 <param name="type" type="select" label="Sequence input type"> |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
54 <option value="fasta">FASTA</option> |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
55 <option value="paired">Paired-end FASTQs</option> |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
56 <option value="single">Single-end FASTQ</option> |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
57 <option value="paired_collection">Paired-end FASTQ collection</option> |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
58 </param> |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
59 <when value="fasta"> |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
60 <param name="fasta" |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
61 type="data" format="fasta" |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
62 optional="false" |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
63 label="FASTA file" |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
64 /> |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
65 </when> |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
66 <when value="paired"> |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
67 <param name="forward" |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
68 type="data" format="fastq,fastqsanger,fastqillumina,fastqsolexa" |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
69 optional="false" |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
70 label="Forward FASTQ file" |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
71 help="Must have ASCII encoded quality scores" |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
72 /> |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
73 <param name="reverse" |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
74 type="data" format="fastq,fastqsanger,fastqillumina,fastqsolexa" |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
75 optional="false" |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
76 label="Reverse FASTQ file" |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
77 help="File format must match the Forward FASTQ file" |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
78 /> |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
79 </when> |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
80 <when value="single"> |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
81 <param name="single" |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
82 type="data" format="fastq,fastqsanger,fastqillumina,fastqsolexa" |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
83 optional="false" |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
84 label="Single-end FASTQ file" |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
85 /> |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
86 </when> |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
87 <when value="paired_collection"> |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
88 <param name="paired_collection" |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
89 type="data_collection" format="fastq,fastqsanger,fastqillumina,fastqsolexa,fastq.gz,txt" |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
90 collection_type="paired" |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
91 optional="false" |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
92 label="Paired-end FASTQ collection" |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
93 help="" |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
94 /> |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
95 </when> |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
96 </conditional> |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
97 <section name="adv" title="Advanced Options" expanded="false"> |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
98 <param name="top_n_results" |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
99 type="integer" |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
100 label="Top N matches to report (0 to report all)" |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
101 min="0" |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
102 value="0" |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
103 optional="true" |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
104 /> |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
105 <param name="min_identity" |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
106 type="float" value="0.9" min="0.0" max="1.0" |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
107 label="Mash dist min. identity to report" |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
108 optional="true" |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
109 /> |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
110 <param name="max_pvalue" |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
111 type="float" value="0.01" min="0.0" max="1.0" |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
112 label="Mash screen max. p-value to report" |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
113 optional="true" |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
114 /> |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
115 <param name="output_type" |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
116 type="select" |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
117 label="Output type" |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
118 multiple="false"> |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
119 <option value="tab" selected="true">Tabular (tab-delimited values)</option> |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
120 <option value="csv">CSV (Comma Separated Values)</option> |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
121 </param> |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
122 <param name="verbosity" |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
123 type="select" |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
124 label="Logging verbosity"> |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
125 <option value="">Error messages only</option> |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
126 <option value="-v">Show warning messages</option> |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
127 <option value="-vv" selected="true">Show info messages</option> |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
128 <option value="-vvv">Show debug messages</option> |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
129 </param> |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
130 </section> |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
131 </inputs> |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
132 <outputs> |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
133 <data |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
134 name="output_path_csv" |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
135 format="csv" |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
136 label="RefSeq Masher contains table" |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
137 from_work_dir="refseq_masher-contains.csv"> |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
138 <filter>adv['output_type'] == 'csv'</filter> |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
139 </data> |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
140 <data |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
141 name="output_path_tab" |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
142 format="tabular" |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
143 label="RefSeq Masher contains table" |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
144 from_work_dir="refseq_masher-contains.tab"> |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
145 <filter>adv['output_type'] == 'tab'</filter> |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
146 </data> |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
147 </outputs> |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
148 <tests> |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
149 <test> |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
150 <conditional name="input"> |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
151 <param name="type" value="single"/> |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
152 <param name="single" value="SRR1203042_1-head4000.fastq"/> |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
153 </conditional> |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
154 <section name="adv"> |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
155 <param name="top_n_results" value="5"/> |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
156 <param name="output_type" value="tab"/> |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
157 <param name="min_identity" value="0.9"/> |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
158 <param name="max_pvalue" value="0.01"/> |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
159 </section> |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
160 <output name="output_path_tab" |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
161 value="SRR1203042_1-head4000-contains.tab" |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
162 ftype="tabular" |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
163 lines_diff="0"> |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
164 </output> |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
165 </test> |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
166 </tests> |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
167 <help> |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
168 <![CDATA[ |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
169 RefSeq Masher - Containment |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
170 =========================== |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
171 |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
172 Find what NCBI RefSeq genomes are contained within your sequence data using Mash_ with a Mash sketch database of 54,925 NCBI RefSeq Genomes. |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
173 |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
174 |
1
2c1cb37a3ffe
planemo upload for repository https://github.com/phac-nml/refseq_masher commit e83730c5df84a960af58ff09db7eb09d11df2398
nml
parents:
0
diff
changeset
|
175 Source code available on Github at github.com/phac-nml/refseq_masher |
0
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
176 |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
177 |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
178 `contains` - find what NCBI RefSeq Genomes are contained in your input sequences |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
179 -------------------------------------------------------------------------------- |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
180 |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
181 If you have a metagenomic sample or maybe a sample with some contamination, you may be interested in seeing what's in your sample. You can do this with `refseq_masher contains <INPUT>`.:: |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
182 |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
183 Usage: refseq_masher contains [OPTIONS] INPUT... |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
184 |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
185 Find the NCBI RefSeq genomes contained in your sequence files using Mash |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
186 Screen |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
187 |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
188 Input is expected to be one or more FASTA/FASTQ files or one or more |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
189 directories containing FASTA/FASTQ files. Files can be Gzipped. |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
190 |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
191 Options: |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
192 --mash-bin TEXT Mash binary path (default="mash") |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
193 -o, --output PATH Output file path (default="-"/stdout) |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
194 --output-type [tab|csv] Output file type (tab|csv) |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
195 -n, --top-n-results INTEGER Output top N results sorted by identity in |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
196 ascending order (default=0/all) |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
197 -i, --min-identity FLOAT Mash screen min identity to report |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
198 (default=0.9) |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
199 -v, --max-pvalue FLOAT Mash screen max p-value to report |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
200 (default=0.01) |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
201 -p, --parallelism INTEGER Mash screen parallelism; number of threads to |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
202 spawn (default=1) |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
203 -h, --help Show this message and exit. |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
204 |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
205 |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
206 Example - metagenomic a sample SAMEA1877340_ |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
207 ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
208 |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
209 For this example, we're going to see what RefSeq genomes are contained within sample SAMEA1877340_ from BioProject PRJEB1775_. |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
210 |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
211 |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
212 Description from BioProject PRJEB1775_: |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
213 |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
214 .. epigraph:: |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
215 |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
216 Design, Setting and Patients Forty-five samples were selected from a set of fecal specimens obtained from patients with diarrhea during the 2011 outbreak of STEC O104:H4 in Germany. Samples were chosen to represent STEC-positive patients with a range of clinical conditions and colony counts together with a small number of patients with other infections (Campylobacter jejnuni, Clostridium difficile and Salmonella enterica). Samples were subjected to high-throughput sequencing on the Illumina MiSeq and HiSeq 2500, followed by bioinformatics analysis. |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
217 |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
218 |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
219 We're going to download the FASTQ files for ERR260489_:: |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
220 |
1
2c1cb37a3ffe
planemo upload for repository https://github.com/phac-nml/refseq_masher commit e83730c5df84a960af58ff09db7eb09d11df2398
nml
parents:
0
diff
changeset
|
221 wget ftp.sra.ebi.ac.uk/vol1/fastq/ERR260/ERR260489/ERR260489_1.fastq.gz |
2c1cb37a3ffe
planemo upload for repository https://github.com/phac-nml/refseq_masher commit e83730c5df84a960af58ff09db7eb09d11df2398
nml
parents:
0
diff
changeset
|
222 wget ftp.sra.ebi.ac.uk/vol1/fastq/ERR260/ERR260489/ERR260489_2.fastq.gz |
0
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
223 |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
224 |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
225 We're going to run `refseq_masher` against these FASTQ files:: |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
226 |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
227 refseq_masher -vv contains --top-n-results 50 -p 12 -o containment-ERR260489.tab ERR260489_1.fastq.gz ERR260489_2.fastq.gz |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
228 |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
229 **Log**:: |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
230 |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
231 2018-01-29 10:59:25,849 INFO: Grouped 2 fastqs into 1 groups [in ...refseq_masher/refseq_masher/utils.py:174] |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
232 2018-01-29 10:59:25,849 INFO: Collected 0 FASTA inputs and 1 read sets [in ...refseq_masher/refseq_masher/utils.py:185] |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
233 2018-01-29 10:59:25,849 INFO: Running Mash Screen with NCBI RefSeq sketch database against sample "ERR260489" with inputs: ['../ERR260489_1.fastq.gz', '../ERR260489_2.fastq.gz'] [in ...refseq_masher/refseq_masher/mash/screen.py:44] |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
234 Loading ...refseq_masher/refseq_masher/data/RefSeqSketches.msh... |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
235 4669418 distinct hashes. |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
236 Streaming from 2 inputs... |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
237 Estimated distinct k-mers in pool: 206836855 |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
238 Summing shared... |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
239 Computing coverage medians... |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
240 Writing output... |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
241 2018-01-29 11:00:19,665 INFO: Ran Mash Screen on all input. Merging NCBI taxonomic information into results output. [in ...refseq_masher/refseq_masher/cli.py:134] |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
242 2018-01-29 11:00:19,666 INFO: Fetching all taxonomy info for 23 unique NCBI Taxonomy UIDs [in ...refseq_masher/refseq_masher/taxonomy.py:35] |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
243 2018-01-29 11:00:19,669 INFO: Dropping columns with all NA values (ncol=32) [in ...refseq_masher/refseq_masher/taxonomy.py:38] |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
244 2018-01-29 11:00:19,671 INFO: Columns with all NA values dropped (ncol=12) [in ...refseq_masher/refseq_masher/taxonomy.py:40] |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
245 2018-01-29 11:00:19,671 INFO: Merging Mash results with relevant taxonomic information [in ...refseq_masher/refseq_masher/taxonomy.py:41] |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
246 2018-01-29 11:00:19,674 INFO: Merged Mash results with taxonomy info [in ...refseq_masher/refseq_masher/taxonomy.py:43] |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
247 2018-01-29 11:00:19,674 INFO: Merged taxonomic information into results output [in ...refseq_masher/refseq_masher/cli.py:136] |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
248 2018-01-29 11:00:19,674 INFO: Reordering output columns [in ...refseq_masher/refseq_masher/cli.py:137] |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
249 2018-01-29 11:00:19,677 INFO: Wrote output to "containment-ERR260489.tab" [in ...refseq_masher/refseq_masher/writers.py:20] |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
250 |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
251 |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
252 |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
253 **Output** |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
254 |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
255 +-----------+--------------------------------------+----------+----------------+----------------------+--------+--------------------------------------------------------------------------------------------------------------------------------------------------+-----------------------+------------------------------+------------------+--------------------+------------------+---------------------+-------------------+-------------------------+------------+---------+----------+------------+-----------+---------+---------------------+----------------------------------------------------------------------------------------------+--------------------------+----------------+ |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
256 | sample | top_taxonomy_name | identity | shared_hashes | median_multiplicity | pvalue | full_taxonomy | taxonomic_subspecies | taxonomic_species | taxonomic_genus | taxonomic_family | taxonomic_order | taxonomic_class | taxonomic_phylum | taxonomic_superkingdom | subspecies | serovar | plasmid | bioproject | biosample | taxid | assembly_accession | match_id | taxonomic_species group | match_comment | |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
257 +===========+======================================+==========+================+======================+========+==================================================================================================================================================+=======================+==============================+==================+====================+==================+=====================+===================+=========================+============+=========+==========+============+===========+=========+=====================+==============================================================================================+==========================+================+ |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
258 | ERR260489 | Bacteroides fragilis | 1.0 | 400/400 | 786 | 0.0 | Bacteria; FCB group; Bacteroidetes/Chlorobi group; Bacteroidetes; Bacteroidia; Bacteroidales; Bacteroidaceae; Bacteroides; fragilis | | Bacteroides fragilis | Bacteroides | Bacteroidaceae | Bacteroidales | Bacteroidia | Bacteroidetes | Bacteria | | | pLV22a | | | 817 | | ./rcn/refseq-NG-817-.-.-.-pLV22a-Bacteroides_fragilis.fna | | | |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
259 +-----------+--------------------------------------+----------+----------------+----------------------+--------+--------------------------------------------------------------------------------------------------------------------------------------------------+-----------------------+------------------------------+------------------+--------------------+------------------+---------------------+-------------------+-------------------------+------------+---------+----------+------------+-----------+---------+---------------------+----------------------------------------------------------------------------------------------+--------------------------+----------------+ |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
260 | [1 row] | | | | | | | | | | | | | | | | | | | | | | | | | |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
261 +-----------+--------------------------------------+----------+----------------+----------------------+--------+--------------------------------------------------------------------------------------------------------------------------------------------------+-----------------------+------------------------------+------------------+--------------------+------------------+---------------------+-------------------+-------------------------+------------+---------+----------+------------+-----------+---------+---------------------+----------------------------------------------------------------------------------------------+--------------------------+----------------+ |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
262 | ERR260489 | Escherichia coli O104:H4 str. E92/11 | 1.0 | 400/400 | 48 | 0.0 | Bacteria; Proteobacteria; Gammaproteobacteria; Enterobacterales; Enterobacteriaceae; Escherichia; coli; O104:H4; str. E92/11 | | Escherichia coli | Escherichia | Enterobacteriaceae | Enterobacterales | Gammaproteobacteria | Proteobacteria | Bacteria | | | pE9211p3 | | | 1090927 | NZ_AHAU | ./rcn/refseq-NZ-1090927-.-.-NZ_AHAU-pE9211p3-Escherichia_coli_O104_H4_str._E92_11.fna | | | |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
263 +-----------+--------------------------------------+----------+----------------+----------------------+--------+--------------------------------------------------------------------------------------------------------------------------------------------------+-----------------------+------------------------------+------------------+--------------------+------------------+---------------------+-------------------+-------------------------+------------+---------+----------+------------+-----------+---------+---------------------+----------------------------------------------------------------------------------------------+--------------------------+----------------+ |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
264 | [3 rows] | | | | | | | | | | | | | | | | | | | | | | | | | |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
265 +-----------+--------------------------------------+----------+----------------+----------------------+--------+--------------------------------------------------------------------------------------------------------------------------------------------------+-----------------------+------------------------------+------------------+--------------------+------------------+---------------------+-------------------+-------------------------+------------+---------+----------+------------+-----------+---------+---------------------+----------------------------------------------------------------------------------------------+--------------------------+----------------+ |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
266 | ERR260489 | Kingella kingae KKC2005004457 | 1.0 | 400/400 | 5 | 0.0 | Bacteria; Proteobacteria; Betaproteobacteria; Neisseriales; Neisseriaceae; Kingella; kingae; KKC2005004457 | | Kingella kingae | Kingella | Neisseriaceae | Neisseriales | Betaproteobacteria | Proteobacteria | Bacteria | | | unnamed | | | 1229911 | | ./rcn/refseq-NG-1229911-.-.-.-unnamed-Kingella_kingae_KKC2005004457.fna | | | |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
267 +-----------+--------------------------------------+----------+----------------+----------------------+--------+--------------------------------------------------------------------------------------------------------------------------------------------------+-----------------------+------------------------------+------------------+--------------------+------------------+---------------------+-------------------+-------------------------+------------+---------+----------+------------+-----------+---------+---------------------+----------------------------------------------------------------------------------------------+--------------------------+----------------+ |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
268 | ERR260489 | Bacteroides cellulosilyticus WH2 | 0.99984 | 399/400 | 772 | 0.0 | Bacteria; FCB group; Bacteroidetes/Chlorobi group; Bacteroidetes; Bacteroidia; Bacteroidales; Bacteroidaceae; Bacteroides; cellulosilyticus; WH2 | | Bacteroides cellulosilyticus | Bacteroides | Bacteroidaceae | Bacteroidales | Bacteroidia | Bacteroidetes | Bacteria | | | pBWH2B | | | 1268240 | NZ_ATFI | ./rcn/refseq-NZ-1268240-.-.-NZ_ATFI-pBWH2B-Bacteroides_cellulosilyticus_WH2.fna | | | |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
269 +-----------+--------------------------------------+----------+----------------+----------------------+--------+--------------------------------------------------------------------------------------------------------------------------------------------------+-----------------------+------------------------------+------------------+--------------------+------------------+---------------------+-------------------+-------------------------+------------+---------+----------+------------+-----------+---------+---------------------+----------------------------------------------------------------------------------------------+--------------------------+----------------+ |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
270 | [1 row] | | | | | | | | | | | | | | | | | | | | | | | | | |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
271 +-----------+--------------------------------------+----------+----------------+----------------------+--------+--------------------------------------------------------------------------------------------------------------------------------------------------+-----------------------+------------------------------+------------------+--------------------+------------------+---------------------+-------------------+-------------------------+------------+---------+----------+------------+-----------+---------+---------------------+----------------------------------------------------------------------------------------------+--------------------------+----------------+ |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
272 | ERR260489 | Klebsiella pneumoniae | 0.99984 | 399/400 | 4 | 0.0 | Bacteria; Proteobacteria; Gammaproteobacteria; Enterobacterales; Enterobacteriaceae; Klebsiella; pneumoniae | | Klebsiella pneumoniae | Klebsiella | Enterobacteriaceae | Enterobacterales | Gammaproteobacteria | Proteobacteria | Bacteria | | | pMRC151 | | | 573 | | ./rcn/refseq-NG-573-.-.-.-pMRC151-Klebsiella_pneumoniae.fna | | | |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
273 +-----------+--------------------------------------+----------+----------------+----------------------+--------+--------------------------------------------------------------------------------------------------------------------------------------------------+-----------------------+------------------------------+------------------+--------------------+------------------+---------------------+-------------------+-------------------------+------------+---------+----------+------------+-----------+---------+---------------------+----------------------------------------------------------------------------------------------+--------------------------+----------------+ |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
274 | [37 rows] | | | | | | | | | | | | | | | | | | | | | | | | | |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
275 +-----------+--------------------------------------+----------+----------------+----------------------+--------+--------------------------------------------------------------------------------------------------------------------------------------------------+-----------------------+------------------------------+------------------+--------------------+------------------+---------------------+-------------------+-------------------------+------------+---------+----------+------------+-----------+---------+---------------------+----------------------------------------------------------------------------------------------+--------------------------+----------------+ |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
276 |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
277 Some of the top genomes contained in this sample are sorted by identity and median multiplicity are: |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
278 |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
279 - *Bacteroides fragilis* - fully contained (400/400) and high multiplicity (768) |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
280 - *Escherichia coli* O104:H4 - fully contained (400/400) and median multiplicity of 48 |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
281 - *Kingella kingae* - fully contained (400/400) and median multiplicity of 5 |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
282 - *Klebsiella pneumoniae* - 399/400 sketches contained with median multiplicity of 4 |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
283 |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
284 So with Mash we are able to find that the sample contained the expected genomic data (especially *E. coli* O104:H4). |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
285 |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
286 |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
287 |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
288 Legal |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
289 ----- |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
290 |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
291 Copyright Government of Canada 2017 |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
292 |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
293 Written by: National Microbiology Laboratory, Public Health Agency of Canada |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
294 |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
295 Licensed under the Apache License, Version 2.0 (the "License"); you may not use |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
296 this work except in compliance with the License. You may obtain a copy of the |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
297 License at: |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
298 |
1
2c1cb37a3ffe
planemo upload for repository https://github.com/phac-nml/refseq_masher commit e83730c5df84a960af58ff09db7eb09d11df2398
nml
parents:
0
diff
changeset
|
299 www.apache.org/licenses/LICENSE-2.0 |
0
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
300 |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
301 Unless required by applicable law or agreed to in writing, software distributed |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
302 under the License is distributed on an "AS IS" BASIS, WITHOUT WARRANTIES OR |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
303 CONDITIONS OF ANY KIND, either express or implied. See the License for the |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
304 specific language governing permissions and limitations under the License. |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
305 |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
306 Contact |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
307 ------- |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
308 |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
309 **Gary van Domselaar**: gary.vandomselaar@phac-aspc.gc.ca |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
310 |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
311 |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
312 |
1
2c1cb37a3ffe
planemo upload for repository https://github.com/phac-nml/refseq_masher commit e83730c5df84a960af58ff09db7eb09d11df2398
nml
parents:
0
diff
changeset
|
313 .. _Mash: genomebiology.biomedcentral.com/articles/10.1186/s13059-016-0997-x |
2c1cb37a3ffe
planemo upload for repository https://github.com/phac-nml/refseq_masher commit e83730c5df84a960af58ff09db7eb09d11df2398
nml
parents:
0
diff
changeset
|
314 .. _SAMEA1877340: www.ebi.ac.uk/ena/data/view/SAMEA1877340 |
2c1cb37a3ffe
planemo upload for repository https://github.com/phac-nml/refseq_masher commit e83730c5df84a960af58ff09db7eb09d11df2398
nml
parents:
0
diff
changeset
|
315 .. _PRJEB1775: www.ebi.ac.uk/ena/data/view/PRJEB1775 |
2c1cb37a3ffe
planemo upload for repository https://github.com/phac-nml/refseq_masher commit e83730c5df84a960af58ff09db7eb09d11df2398
nml
parents:
0
diff
changeset
|
316 .. _ERR260489: www.ebi.ac.uk/ena/data/view/ERR260489&display=html |
0
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
317 |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
318 ]]> |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
319 </help> |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
320 <citations> |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
321 <!-- Citation for Mash paper --> |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
322 <citation type="doi">10.1186/s13059-016-0997-x</citation> |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
323 </citations> |
26df66c32861
planemo upload commit 80c22275be05e29208e991019309dfffa9704f39
nml
parents:
diff
changeset
|
324 </tool> |