Mercurial > repos > iuc > porechop
comparison porechop.xml @ 0:24822689acf8 draft
planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/porechop commit b8cc84454aedcdbe22d385c1d7067fab599b9090
author | iuc |
---|---|
date | Tue, 18 Sep 2018 16:24:49 -0400 |
parents | |
children | 93d623d9979c |
comparison
equal
deleted
inserted
replaced
-1:000000000000 | 0:24822689acf8 |
---|---|
1 <tool id="porechop" name="Porechop" version="0.2.3"> | |
2 <description>adapter trimmer for Oxford Nanopore reads</description> | |
3 <requirements> | |
4 <requirement type="package" version="0.2.3_seqan2.1.1">porechop</requirement> | |
5 </requirements> | |
6 <version_command>porechop --version</version_command> | |
7 <command detect_errors="exit_code"><![CDATA[ | |
8 porechop | |
9 -i '$input_file' | |
10 --format '$format' | |
11 --barcode_threshold '$barcode_binning_settings.barcode_threshold' | |
12 --barcode_diff '$barcode_binning_settings.barcode_diff' | |
13 $barcode_binning_settings.require_two_barcodes | |
14 $barcode_binning_settings.discard_unassigned | |
15 --adapter_threshold '$adapter_search_settings.adapter_threshold' | |
16 --check_reads '$adapter_search_settings.check_reads' | |
17 --scoring_scheme '$adapter_search_settings.scoring_scheme' | |
18 --end_size '$end_adapter_settings.end_size' | |
19 --min_trim_size '$end_adapter_settings.min_trim_size' | |
20 --extra_end_trim '$end_adapter_settings.extra_end_trim' | |
21 --end_threshold '$end_adapter_settings.end_threshold' | |
22 $middle_adapter_settings.no_split | |
23 $middle_adapter_settings.discard_middle | |
24 --middle_threshold '$middle_adapter_settings.middle_threshold' | |
25 --extra_middle_trim_good_side '$middle_adapter_settings.extra_middle_trim_good_side' | |
26 --extra_middle_trim_bad_side '$middle_adapter_settings.extra_middle_trim_bad_side' | |
27 --min_split_read_size '$middle_adapter_settings.min_split_read_size' | |
28 -o 'out.$format' | |
29 | |
30 ]]></command> | |
31 <inputs> | |
32 <param name="input_file" type="data" format="fasta,fastq" label="Input FASTA/FASTQ" help="FASTA/FASTQ of input reads" /> | |
33 <param name="format" type="select" label="Output format for the reads" help="Output format for the reads - if auto, the format will be chosen based on the output filename or the input read format"> | |
34 <option selected="True" value="fasta">FASTA</option> | |
35 <option value="fastq">FASTQ</option> | |
36 <option value="fasta.gz">FASTA.gz</option> | |
37 <option value="fastq.gz">FASTQ.gz</option> | |
38 </param> | |
39 <section name="barcode_binning_settings" title="Barcode binning settings"> | |
40 <param argument="--barcode_threshold" type="float" min="0" max="100" value="75.0" optional="True" label="Percent identity for binning" | |
41 help="A read must have at least this percent identity to a barcode to be binned (default: 75.0)"/> | |
42 <param argument="--barcode_diff" type="float" min="0" max="100" value="5.0" optional="True" label="Minimum difference in identity" | |
43 help="If the difference between a read's best barcode identity and its second-best barcode identity is less than this value, it will not be put in a barcode bin (to exclude cases which are too close to call) (default: 5.0)"/> | |
44 <param argument="--require_two_barcodes" type="boolean" checked="false" truevalue="--require_two_barcodes" falsevalue="" label="Require two matches for binning" | |
45 help="Reads will only be put in barcode bins if they have a strong match for the barcode on both their start and end (default: a read can be binned with a match at its start or end)"/> | |
46 <param argument="--discard_unassigned" type="boolean" checked="false" truevalue="--discard_unassigned" falsevalue="" label="Discard unassigned reads" | |
47 help="Discard unassigned reads (instead of creating a 'none' bin) (default: False)"/> | |
48 </section> | |
49 <section name="adapter_search_settings" title="Adapter search settings"> | |
50 <param argument="--adapter_threshold" type="float" min="0" max="100" value="90.0" optional="True" label="Minimum identity" | |
51 help="An adapter set has to have at least this percent identity to be labelled as present and trimmed off (0 to 100) (default: 90.0)"/> | |
52 <param argument="--check_reads" type="integer" min="0" value="10000" optional="True" label="Number of alligned reads" | |
53 help="This many reads will be aligned to all possible adapters to determine which adapter sets are present (default: 10000)"/> | |
54 <param argument="--scoring_scheme" type="text" value="3,-6,-5,-2" label="Scoring scheme" | |
55 help="Comma-delimited string of alignment scores: match, mismatch, gap open, gap extend"> | |
56 <validator type="regex" message="Scoring scheme must be comma-separated string of four positive/negative integers">^((-?\d+[,]){3})-?\d+$</validator> | |
57 </param> | |
58 </section> | |
59 <section name="end_adapter_settings" title="End adapter settings"> | |
60 <param argument="--end_size" type="integer" min="0" value="150" optional="True" label="Number of bases" | |
61 help="The number of base pairs at each end of the read which will be searched for adapter sequences (default: 150)"/> | |
62 <param argument="--min_trim_size" type="integer" min="0" value="4" optional="True" label="Minimum trim length" | |
63 help="Adapter alignments smaller than this will be ignored (default: 4)"/> | |
64 <param argument="--extra_end_trim" type="integer" min="0" value="2" optional="True" label="Extra bases trimmed" | |
65 help="This many additional bases will be removed next to adapters found at the ends of reads (default: 2)"/> | |
66 <param argument="--end_threshold" type="float" min="0" max="100" value="75.0" optional="True" label="Minimum percent identity" | |
67 help="Adapters at the ends of reads must have at least this percent identity to be removed (0 to 100) (default: 75.0)"/> | |
68 </section> | |
69 <section name="middle_adapter_settings" title="Middle adapter settings"> | |
70 <param argument="--no_split" type="boolean" checked="false" truevalue="--no_split" falsevalue="" label="Skip splitting" | |
71 help="Skip splitting reads based on middle adapters (default: split reads when an adapter is found in the middle)"/> | |
72 <param argument="--discard_middle" type="boolean" checked="false" truevalue="--discard_middle" falsevalue="" label="Discard reads with middle adapter" | |
73 help="Reads with middle adapters will be discarded (default: reads with middle adapters are split) (required for reads to be used with Nanopolish, this option is on by default when outputting reads into barcode bins)"/> | |
74 <param argument="--middle_threshold" type="float" min="0" max="100" value="85.0" optional="True" label="Minimum percent identity" | |
75 help="Adapters in the middle of reads must have at least this percent identity to be found (0 to 100) (default: 85.0)"/> | |
76 <param argument="--extra_middle_trim_good_side" type="integer" min="0" value="10" optional="True" label="Extra trimming good side" | |
77 help="This many additional bases will be removed next to middle adapters on their 'good' side (default: 10)"/> | |
78 <param argument="--extra_middle_trim_bad_side" type="integer" min="0" value="100" optional="True" label="Extra trimming bad side" | |
79 help="This many additional bases will be removed next to middle adapters on their 'bad' side (default: 100)"/> | |
80 <param argument="--min_split_read_size" type="integer" min="0" value="1000" optional="True" label="Minimum length reads post-split" | |
81 help="Post-split read pieces smaller than this many base pairs will not be outputted (default: 1000)"/> | |
82 </section> | |
83 </inputs> | |
84 <outputs> | |
85 <data name="outfile" format="fasta" from_work_dir="out.*" label="${tool.name} on ${on_string}: Trimmed"> | |
86 <change_format> | |
87 <when input="format" value="fastq" format="fastq"/> | |
88 <when input="format" value="fasta.gz" format="fasta.gz"/> | |
89 <when input="format" value="fastq.gz" format="fastq.gz"/> | |
90 </change_format> | |
91 </data> | |
92 </outputs> | |
93 <tests> | |
94 <test> | |
95 <param name="input_file" ftype="fasta" value="test_format.fasta"/> | |
96 <param name="format" value="fasta"/> | |
97 <output name="outfile" ftype="fasta" file="out.fasta"/> | |
98 </test> | |
99 <test> | |
100 <param name="input_file" ftype="fasta" value="test_format.fasta"/> | |
101 <param name="format" value="fastq"/> | |
102 <output name="outfile" ftype="fastq" file="out.fastq"/> | |
103 </test> | |
104 <test> | |
105 <param name="input_file" ftype="fasta" value="test_format.fasta"/> | |
106 <param name="format" value="fasta.gz"/> | |
107 <output name="outfile" ftype="fasta.gz" file="out.fasta.gz" compare="sim_size"/> | |
108 </test> | |
109 <test> | |
110 <param name="input_file" ftype="fasta" value="test_format.fasta"/> | |
111 <param name="format" value="fastq.gz"/> | |
112 <output name="outfile" ftype="fastq.gz" file="out.fastq.gz" compare="sim_size"/> | |
113 </test> | |
114 <test> | |
115 <param name="input_file" ftype="fasta" value="test_format.fasta"/> | |
116 <param name="format" value="fasta"/> | |
117 <param name="barcode_threshold" value="70"/> | |
118 <param name="barcode_diff" value="4"/> | |
119 <param name="require_two_barcodes" value="True"/> | |
120 <param name="discard_unassigned" value="True"/> | |
121 <param name="end_size" value="100"/> | |
122 <param name="min_trim_size" value="2"/> | |
123 <param name="extra_end_trim" value="1"/> | |
124 <param name="end_threshold" value="80"/> | |
125 <param name="discard_middle" value="True"/> | |
126 <param name="middle_threshold" value="90"/> | |
127 <param name="extra_middle_trim_good_size" value="3"/> | |
128 <param name="extra_middle_trim_bad_size" value="30"/> | |
129 <param name="min_split_read_size" value="1500"/> | |
130 <output name="outfile" ftype="fasta" file="out_advanced.fasta"/> | |
131 </test> | |
132 </tests> | |
133 <help><![CDATA[ | |
134 Porechop is a tool for finding and removing adapters from Oxford Nanopore reads. | |
135 Adapters on the ends of reads are trimmed off, and when a read has an adapter in | |
136 its middle, it is treated as chimeric and chopped into separate reads. Porechop | |
137 performs thorough alignments to effectively find adapters, even at low sequence identity. | |
138 | |
139 Porechop also supports demultiplexing of Nanopore reads that were barcoded with | |
140 the Native Barcoding Kit, PCR Barcoding Kit or Rapid Barcoding Kit. | |
141 ]]></help> | |
142 <citations> | |
143 <citation type="bibtex"> | |
144 @misc{rrwick2017, | |
145 author = {Wick, Ryan}, | |
146 year = {2017}, | |
147 title = {Porechop}, | |
148 publisher = {GitHub}, | |
149 journal = {GitHub repository}, | |
150 url = {https://github.com/rrwick/Porechop}, | |
151 } | |
152 </citation> | |
153 </citations> | |
154 </tool> |