annotate tools/seq_filter_by_mapping/seq_filter_by_mapping.xml @ 2:48e71dfd51b3 draft

v0.0.5 Depend on Biopython 1.67 from Tool Shed or (Bio)conda
author peterjc
date Wed, 10 May 2017 13:16:44 -0400
parents 8ff0ac66f1a3
children 481b0a925e66
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
2
48e71dfd51b3 v0.0.5 Depend on Biopython 1.67 from Tool Shed or (Bio)conda
peterjc
parents: 1
diff changeset
1 <tool id="seq_filter_by_mapping" name="Filter sequences by mapping" version="0.0.5">
0
1d773da0ccf0 Uploaded v0.0.2, fixed some error messages
peterjc
parents:
diff changeset
2 <description>from SAM/BAM file</description>
1d773da0ccf0 Uploaded v0.0.2, fixed some error messages
peterjc
parents:
diff changeset
3 <requirements>
2
48e71dfd51b3 v0.0.5 Depend on Biopython 1.67 from Tool Shed or (Bio)conda
peterjc
parents: 1
diff changeset
4 <requirement type="package" version="1.67">biopython</requirement>
0
1d773da0ccf0 Uploaded v0.0.2, fixed some error messages
peterjc
parents:
diff changeset
5 <requirement type="package" version="0.1.19">samtools</requirement>
1d773da0ccf0 Uploaded v0.0.2, fixed some error messages
peterjc
parents:
diff changeset
6 </requirements>
2
48e71dfd51b3 v0.0.5 Depend on Biopython 1.67 from Tool Shed or (Bio)conda
peterjc
parents: 1
diff changeset
7 <version_command>
48e71dfd51b3 v0.0.5 Depend on Biopython 1.67 from Tool Shed or (Bio)conda
peterjc
parents: 1
diff changeset
8 python $__tool_directory__/seq_filter_by_mapping.py --version
48e71dfd51b3 v0.0.5 Depend on Biopython 1.67 from Tool Shed or (Bio)conda
peterjc
parents: 1
diff changeset
9 </version_command>
48e71dfd51b3 v0.0.5 Depend on Biopython 1.67 from Tool Shed or (Bio)conda
peterjc
parents: 1
diff changeset
10 <command detect_errors="aggressive">
48e71dfd51b3 v0.0.5 Depend on Biopython 1.67 from Tool Shed or (Bio)conda
peterjc
parents: 1
diff changeset
11 python $__tool_directory__/seq_filter_by_mapping.py -i '$input_file' -f '$input_file.ext' -m $pair_mode
0
1d773da0ccf0 Uploaded v0.0.2, fixed some error messages
peterjc
parents:
diff changeset
12 #if $output_choice_cond.output_choice=="both"
2
48e71dfd51b3 v0.0.5 Depend on Biopython 1.67 from Tool Shed or (Bio)conda
peterjc
parents: 1
diff changeset
13 -p '$output_pos' -n '$output_neg'
0
1d773da0ccf0 Uploaded v0.0.2, fixed some error messages
peterjc
parents:
diff changeset
14 #elif $output_choice_cond.output_choice=="pos"
2
48e71dfd51b3 v0.0.5 Depend on Biopython 1.67 from Tool Shed or (Bio)conda
peterjc
parents: 1
diff changeset
15 -p '$output_pos'
0
1d773da0ccf0 Uploaded v0.0.2, fixed some error messages
peterjc
parents:
diff changeset
16 #elif $output_choice_cond.output_choice=="neg"
2
48e71dfd51b3 v0.0.5 Depend on Biopython 1.67 from Tool Shed or (Bio)conda
peterjc
parents: 1
diff changeset
17 -n '$output_neg'
0
1d773da0ccf0 Uploaded v0.0.2, fixed some error messages
peterjc
parents:
diff changeset
18 #end if
1d773da0ccf0 Uploaded v0.0.2, fixed some error messages
peterjc
parents:
diff changeset
19 ## Now loop over all the mapping files
2
48e71dfd51b3 v0.0.5 Depend on Biopython 1.67 from Tool Shed or (Bio)conda
peterjc
parents: 1
diff changeset
20 #for i in $mapping_file#'${i}' #end for#
0
1d773da0ccf0 Uploaded v0.0.2, fixed some error messages
peterjc
parents:
diff changeset
21 </command>
1d773da0ccf0 Uploaded v0.0.2, fixed some error messages
peterjc
parents:
diff changeset
22 <inputs>
1d773da0ccf0 Uploaded v0.0.2, fixed some error messages
peterjc
parents:
diff changeset
23 <param name="input_file" type="data" format="fasta,fastq,sff" label="Sequence file to be filtered" help="FASTA, FASTQ, or SFF format." />
1d773da0ccf0 Uploaded v0.0.2, fixed some error messages
peterjc
parents:
diff changeset
24 <param name="mapping_file" type="data" format="sam,bam" multiple="true" label="SAM/BAM mapping of those sequences" help="SAM or BAM format." />
1d773da0ccf0 Uploaded v0.0.2, fixed some error messages
peterjc
parents:
diff changeset
25 <conditional name="output_choice_cond">
1d773da0ccf0 Uploaded v0.0.2, fixed some error messages
peterjc
parents:
diff changeset
26 <param name="output_choice" type="select" label="Output mapped reads, unmapped reads, or both?">
1d773da0ccf0 Uploaded v0.0.2, fixed some error messages
peterjc
parents:
diff changeset
27 <option value="both">Both mapped and unmapped reads, as two files</option>
1d773da0ccf0 Uploaded v0.0.2, fixed some error messages
peterjc
parents:
diff changeset
28 <option value="pos">Just mapped reads, as a single file</option>
1d773da0ccf0 Uploaded v0.0.2, fixed some error messages
peterjc
parents:
diff changeset
29 <option value="neg">Just unmapped reads, as a single file</option>
1d773da0ccf0 Uploaded v0.0.2, fixed some error messages
peterjc
parents:
diff changeset
30 </param>
1d773da0ccf0 Uploaded v0.0.2, fixed some error messages
peterjc
parents:
diff changeset
31 <!-- Seems need these dummy entries here, compare this to indels/indel_sam2interval.xml -->
1d773da0ccf0 Uploaded v0.0.2, fixed some error messages
peterjc
parents:
diff changeset
32 <when value="both" />
1d773da0ccf0 Uploaded v0.0.2, fixed some error messages
peterjc
parents:
diff changeset
33 <when value="pos" />
1d773da0ccf0 Uploaded v0.0.2, fixed some error messages
peterjc
parents:
diff changeset
34 <when value="neg" />
1d773da0ccf0 Uploaded v0.0.2, fixed some error messages
peterjc
parents:
diff changeset
35 </conditional>
1d773da0ccf0 Uploaded v0.0.2, fixed some error messages
peterjc
parents:
diff changeset
36 <param name="pair_mode" type="select" label="Paired read treatment">
1d773da0ccf0 Uploaded v0.0.2, fixed some error messages
peterjc
parents:
diff changeset
37 <option value="lax" selected="true">Treat as a pair, allow either read to be mapped</option>
1d773da0ccf0 Uploaded v0.0.2, fixed some error messages
peterjc
parents:
diff changeset
38 <option value="strict">Treat as a pair, require both reads to be mapped</option>
1d773da0ccf0 Uploaded v0.0.2, fixed some error messages
peterjc
parents:
diff changeset
39 <!-- The following would actually be more work as have to store qname/1 and qname/2 separately for filter...
1d773da0ccf0 Uploaded v0.0.2, fixed some error messages
peterjc
parents:
diff changeset
40 <option value="solo">Treat independently (will split partners when only one maps)</option>
1d773da0ccf0 Uploaded v0.0.2, fixed some error messages
peterjc
parents:
diff changeset
41 -->
1d773da0ccf0 Uploaded v0.0.2, fixed some error messages
peterjc
parents:
diff changeset
42 </param>
1d773da0ccf0 Uploaded v0.0.2, fixed some error messages
peterjc
parents:
diff changeset
43 </inputs>
1d773da0ccf0 Uploaded v0.0.2, fixed some error messages
peterjc
parents:
diff changeset
44 <outputs>
1
8ff0ac66f1a3 v0.0.4; Report FASTQ counts; misc internal changes
peterjc
parents: 0
diff changeset
45 <data name="output_pos" format_source="input_file" metadata_source="input_file" label="$input_file.name (mapped)">
0
1d773da0ccf0 Uploaded v0.0.2, fixed some error messages
peterjc
parents:
diff changeset
46 <filter>output_choice_cond["output_choice"] != "neg"</filter>
1d773da0ccf0 Uploaded v0.0.2, fixed some error messages
peterjc
parents:
diff changeset
47 </data>
1
8ff0ac66f1a3 v0.0.4; Report FASTQ counts; misc internal changes
peterjc
parents: 0
diff changeset
48 <data name="output_neg" format_source="input_file" metadata_source="input_file" label="$input_file.name (unmapped)">
0
1d773da0ccf0 Uploaded v0.0.2, fixed some error messages
peterjc
parents:
diff changeset
49 <filter>output_choice_cond["output_choice"] != "pos"</filter>
1d773da0ccf0 Uploaded v0.0.2, fixed some error messages
peterjc
parents:
diff changeset
50 </data>
1d773da0ccf0 Uploaded v0.0.2, fixed some error messages
peterjc
parents:
diff changeset
51 </outputs>
1d773da0ccf0 Uploaded v0.0.2, fixed some error messages
peterjc
parents:
diff changeset
52 <tests>
1d773da0ccf0 Uploaded v0.0.2, fixed some error messages
peterjc
parents:
diff changeset
53 <test>
1d773da0ccf0 Uploaded v0.0.2, fixed some error messages
peterjc
parents:
diff changeset
54 <param name="input_file" value="SRR639755_mito_pairs.fastq.gz" ftype="fastqsanger" />
1d773da0ccf0 Uploaded v0.0.2, fixed some error messages
peterjc
parents:
diff changeset
55 <param name="mapping_file" value="SRR639755_sample_by_coord.sam" ftype="sam" />
1d773da0ccf0 Uploaded v0.0.2, fixed some error messages
peterjc
parents:
diff changeset
56 <param name="pair_mode" value="lax" />
1d773da0ccf0 Uploaded v0.0.2, fixed some error messages
peterjc
parents:
diff changeset
57 <param name="output_choice" value="pos" />
1d773da0ccf0 Uploaded v0.0.2, fixed some error messages
peterjc
parents:
diff changeset
58 <output name="output_pos" file="SRR639755_sample_lax.fastq" ftype="fastqsanger" />
1d773da0ccf0 Uploaded v0.0.2, fixed some error messages
peterjc
parents:
diff changeset
59 </test>
1d773da0ccf0 Uploaded v0.0.2, fixed some error messages
peterjc
parents:
diff changeset
60 <test>
1d773da0ccf0 Uploaded v0.0.2, fixed some error messages
peterjc
parents:
diff changeset
61 <param name="input_file" value="SRR639755_mito_pairs.fastq.gz" ftype="fastqsanger" />
1d773da0ccf0 Uploaded v0.0.2, fixed some error messages
peterjc
parents:
diff changeset
62 <param name="mapping_file" value="SRR639755_sample_by_coord.sam" ftype="sam" />
1d773da0ccf0 Uploaded v0.0.2, fixed some error messages
peterjc
parents:
diff changeset
63 <param name="pair_mode" value="strict" />
1d773da0ccf0 Uploaded v0.0.2, fixed some error messages
peterjc
parents:
diff changeset
64 <param name="output_choice" value="pos" />
1d773da0ccf0 Uploaded v0.0.2, fixed some error messages
peterjc
parents:
diff changeset
65 <output name="output_pos" file="SRR639755_sample_strict.fastq" ftype="fastqsanger" />
1d773da0ccf0 Uploaded v0.0.2, fixed some error messages
peterjc
parents:
diff changeset
66 </test>
1d773da0ccf0 Uploaded v0.0.2, fixed some error messages
peterjc
parents:
diff changeset
67 </tests>
1d773da0ccf0 Uploaded v0.0.2, fixed some error messages
peterjc
parents:
diff changeset
68 <help>
1d773da0ccf0 Uploaded v0.0.2, fixed some error messages
peterjc
parents:
diff changeset
69 **What it does**
1d773da0ccf0 Uploaded v0.0.2, fixed some error messages
peterjc
parents:
diff changeset
70
1d773da0ccf0 Uploaded v0.0.2, fixed some error messages
peterjc
parents:
diff changeset
71 By default it divides a FASTA, FASTQ or Standard Flowgram Format (SFF) file in
1d773da0ccf0 Uploaded v0.0.2, fixed some error messages
peterjc
parents:
diff changeset
72 two, those sequences (or read pairs) which do or don't map in the provided
1d773da0ccf0 Uploaded v0.0.2, fixed some error messages
peterjc
parents:
diff changeset
73 SAM/BAM file. You can opt to have a single output file of just the mapping reads,
1d773da0ccf0 Uploaded v0.0.2, fixed some error messages
peterjc
parents:
diff changeset
74 or just the non-mapping ones.
1d773da0ccf0 Uploaded v0.0.2, fixed some error messages
peterjc
parents:
diff changeset
75
1d773da0ccf0 Uploaded v0.0.2, fixed some error messages
peterjc
parents:
diff changeset
76 **Example Usage**
1d773da0ccf0 Uploaded v0.0.2, fixed some error messages
peterjc
parents:
diff changeset
77
1d773da0ccf0 Uploaded v0.0.2, fixed some error messages
peterjc
parents:
diff changeset
78 You might wish to perform a contamination screan by mapping your reads against
1d773da0ccf0 Uploaded v0.0.2, fixed some error messages
peterjc
parents:
diff changeset
79 known contaminant reference sequences, then use this tool to select only the
1d773da0ccf0 Uploaded v0.0.2, fixed some error messages
peterjc
parents:
diff changeset
80 unmapped reads for further analysis (e.g. *de novo* assembly).
1d773da0ccf0 Uploaded v0.0.2, fixed some error messages
peterjc
parents:
diff changeset
81
1d773da0ccf0 Uploaded v0.0.2, fixed some error messages
peterjc
parents:
diff changeset
82 Similarly you might wish to map your reads against a known bacterial reference,
1d773da0ccf0 Uploaded v0.0.2, fixed some error messages
peterjc
parents:
diff changeset
83 then take the non-mapping sequences forward for analysis if looking for novel
1d773da0ccf0 Uploaded v0.0.2, fixed some error messages
peterjc
parents:
diff changeset
84 plasmids.
1d773da0ccf0 Uploaded v0.0.2, fixed some error messages
peterjc
parents:
diff changeset
85
1d773da0ccf0 Uploaded v0.0.2, fixed some error messages
peterjc
parents:
diff changeset
86
1d773da0ccf0 Uploaded v0.0.2, fixed some error messages
peterjc
parents:
diff changeset
87 **References**
1d773da0ccf0 Uploaded v0.0.2, fixed some error messages
peterjc
parents:
diff changeset
88
1d773da0ccf0 Uploaded v0.0.2, fixed some error messages
peterjc
parents:
diff changeset
89 If you use this Galaxy tool in work leading to a scientific publication please
1d773da0ccf0 Uploaded v0.0.2, fixed some error messages
peterjc
parents:
diff changeset
90 cite:
1d773da0ccf0 Uploaded v0.0.2, fixed some error messages
peterjc
parents:
diff changeset
91
1d773da0ccf0 Uploaded v0.0.2, fixed some error messages
peterjc
parents:
diff changeset
92 Peter J.A. Cock (2014), Galaxy tool for filtering reads by mapping
1d773da0ccf0 Uploaded v0.0.2, fixed some error messages
peterjc
parents:
diff changeset
93 http://toolshed.g2.bx.psu.edu/view/peterjc/seq_filter_by_mapping
1d773da0ccf0 Uploaded v0.0.2, fixed some error messages
peterjc
parents:
diff changeset
94
1d773da0ccf0 Uploaded v0.0.2, fixed some error messages
peterjc
parents:
diff changeset
95 This tool uses Biopython to read and write SFF files, so you may also wish to
1d773da0ccf0 Uploaded v0.0.2, fixed some error messages
peterjc
parents:
diff changeset
96 cite the Biopython application note (and Galaxy too of course):
1d773da0ccf0 Uploaded v0.0.2, fixed some error messages
peterjc
parents:
diff changeset
97
1d773da0ccf0 Uploaded v0.0.2, fixed some error messages
peterjc
parents:
diff changeset
98 Cock et al (2009). Biopython: freely available Python tools for computational
1d773da0ccf0 Uploaded v0.0.2, fixed some error messages
peterjc
parents:
diff changeset
99 molecular biology and bioinformatics. Bioinformatics 25(11) 1422-3.
1d773da0ccf0 Uploaded v0.0.2, fixed some error messages
peterjc
parents:
diff changeset
100 http://dx.doi.org/10.1093/bioinformatics/btp163 pmid:19304878.
1d773da0ccf0 Uploaded v0.0.2, fixed some error messages
peterjc
parents:
diff changeset
101
1d773da0ccf0 Uploaded v0.0.2, fixed some error messages
peterjc
parents:
diff changeset
102 This tool is available to install into other Galaxy Instances via the Galaxy
1d773da0ccf0 Uploaded v0.0.2, fixed some error messages
peterjc
parents:
diff changeset
103 Tool Shed at http://toolshed.g2.bx.psu.edu/view/peterjc/seq_filter_by_mapping
1d773da0ccf0 Uploaded v0.0.2, fixed some error messages
peterjc
parents:
diff changeset
104 </help>
1d773da0ccf0 Uploaded v0.0.2, fixed some error messages
peterjc
parents:
diff changeset
105 <citations>
1d773da0ccf0 Uploaded v0.0.2, fixed some error messages
peterjc
parents:
diff changeset
106 <citation type="doi">10.1093/bioinformatics/btp163</citation>
1d773da0ccf0 Uploaded v0.0.2, fixed some error messages
peterjc
parents:
diff changeset
107 </citations>
1d773da0ccf0 Uploaded v0.0.2, fixed some error messages
peterjc
parents:
diff changeset
108 </tool>