Mercurial > repos > lparsons > fastx_barcode_splitter_enhanced
comparison fastx_barcode_splitter.xml @ 4:0fb7e9130a70 draft default tip
planemo upload for repository https://github.com/lparsons/galaxy_tools/tree/master/tools/fastx_barcode_splitter_enhanced commit 460463a5406419fe8e113467bdb8bd093d21e7c5
author | lparsons |
---|---|
date | Mon, 02 May 2016 17:04:32 -0400 |
parents | e7b7cdc1834d |
children |
comparison
equal
deleted
inserted
replaced
3:e7b7cdc1834d | 4:0fb7e9130a70 |
---|---|
1 <tool id="cshl_princeton_fastx_barcode_splitter" version="1.1" name="Barcode Splitter"> | 1 <tool id="cshl_princeton_fastx_barcode_splitter" version="1.2" name="Barcode Splitter"> |
2 <description></description> | 2 <description></description> |
3 <command interpreter="bash"><![CDATA[ | 3 <command interpreter="bash" detect_errors="aggressive"><![CDATA[ |
4 fastx_barcode_splitter_galaxy_wrapper.sh $BARCODE $input "split/" $input.extension --mismatches $mismatches --partial $partial | 4 fastx_barcode_splitter_galaxy_wrapper.sh $BARCODE $input "split/" $input.extension --mismatches $mismatches --partial $partial |
5 #if $refBarcodeLocation.barcodeLocation == "idxfile": | 5 #if $refBarcodeLocation.barcodeLocation == "idxfile": |
6 --idxfile $refBarcodeLocation.idxfile | 6 --idxfile $refBarcodeLocation.idxfile |
7 #else: | 7 #else: |
8 $refBarcodeLocation.EOL | 8 $refBarcodeLocation.EOL |
9 #end if | 9 #end if |
10 > $output | 10 > $summary |
11 ]]> | 11 ]]> |
12 </command> | 12 </command> |
13 | 13 |
14 <inputs> | 14 <inputs> |
15 <param format="txt" name="BARCODE" type="data" label="Barcodes to use" /> | 15 <param format="txt" name="BARCODE" type="data" label="Barcodes to use" /> |
16 <param format="fasta,fastqsanger,fastqsolexa,fastqillumina" name="input" type="data" label="Library to split" /> | 16 <param format="fasta,fastq,fastqsanger,fastqsolexa,fastqillumina" name="input" type="data" label="Library to split" /> |
17 | 17 |
18 <conditional name="refBarcodeLocation"> | 18 <conditional name="refBarcodeLocation"> |
19 <param name="barcodeLocation" type="select" label="Barcodes found at"> | 19 <param name="barcodeLocation" type="select" label="Barcodes found at"> |
20 <option value="bol">Start of sequence (5' end)</option> | 20 <option value="bol">Start of sequence (5' end)</option> |
21 <option value="eol">End of sequence (3' end)</option> | 21 <option value="eol">End of sequence (3' end)</option> |
22 <option value="idxfile">Separate index file</option> | 22 <option value="idxfile">Separate index file</option> |
23 </param> | 23 </param> |
24 <when value="bol"> | 24 <when value="bol"> |
25 <param name="EOL" type="hidden" value="--bol" /> | 25 <param name="EOL" type="hidden" value="--bol" /> |
26 </when> | 26 </when> |
27 <when value="eol"> | 27 <when value="eol"> |
28 <param name="EOL" type="hidden" value="--eol" /> | 28 <param name="EOL" type="hidden" value="--eol" /> |
29 </when> | 29 </when> |
30 <when value="idxfile"> | 30 <when value="idxfile"> |
31 <param name="idxfile" type="data" format="fasta,fastq,fastqsanger" label="Select index read file" /> | 31 <param name="idxfile" type="data" format="fasta,fastq,fastqsanger" label="Select index read file" /> |
32 </when> | 32 </when> |
33 </conditional> | 33 </conditional> |
34 | 34 |
35 <param name="mismatches" type="integer" size="3" value="0" label="Number of allowed mismatches" /> | 35 <param name="mismatches" type="integer" size="3" value="0" label="Number of allowed mismatches" /> |
36 | 36 |
37 <param name="partial" type="integer" size="3" value="0" label="Number of allowed barcodes nucleotide deletions" /> | 37 <param name="partial" type="integer" size="3" value="0" label="Number of allowed barcodes nucleotide deletions" /> |
38 | 38 |
39 </inputs> | 39 </inputs> |
40 | 40 |
41 <outputs> | 41 <outputs> |
42 <data format="html" name="output"> | 42 <data format="tabular" name="summary" label="${tool.name} on ${on_string}: Summary" /> |
43 <discover_datasets pattern="__designation_and_ext__" directory="split" visible="true" label="${tool.name}: ${designation}"/> | 43 <collection name="split_output" type="list" format_source="input" label="${tool.name} on ${on_string}"> |
44 </data> | 44 <discover_datasets pattern="__designation_and_ext__" directory="split" visible="false" label="${designation}"/> |
45 </outputs> | 45 </collection> |
46 </outputs> | |
46 | 47 |
47 <tests> | 48 <tests> |
48 <test> | 49 <test> |
49 <!-- Split a FASTQ file --> | 50 <!-- Split a FASTQ file --> |
50 <param name="BARCODE" value="fastx_barcode_splitter1.txt" /> | 51 <param name="BARCODE" value="fastx_barcode_splitter1.txt" /> |
51 <param name="input" value="fastx_barcode_splitter1.fastq" ftype="fastqsolexa" /> | 52 <param name="input" value="fastx_barcode_splitter1.fastq" ftype="fastqsolexa" /> |
52 <param name="barcodeLocation" value="bol" /> | 53 <param name="barcodeLocation" value="bol" /> |
53 <param name="mismatches" value="2" /> | 54 <param name="mismatches" value="2" /> |
54 <param name="partial" value="0" /> | 55 <param name="partial" value="0" /> |
55 <output name="output" file="fastx_barcode_splitter1.out"> | 56 <output name="summary" file="fastx_barcode_splitter1.out" /> |
56 <discovered_dataset designation="BC1" ftype="fastqsolexa" file="fastx_barcode_splitter1_BC1.out" /> | 57 <collection name="output" type="list"> |
57 <discovered_dataset designation="BC2" ftype="fastqsolexa" file="fastx_barcode_splitter1_BC2.out" /> | 58 <discovered_dataset designation="BC1" ftype="fastqsolexa" file="fastx_barcode_splitter1_BC1.out" /> |
58 <discovered_dataset designation="BC3" ftype="fastqsolexa" file="fastx_barcode_splitter1_BC3.out" /> | 59 <discovered_dataset designation="BC2" ftype="fastqsolexa" file="fastx_barcode_splitter1_BC2.out" /> |
59 <discovered_dataset designation="BC4" ftype="fastqsolexa" file="fastx_barcode_splitter1_BC4.out" /> | 60 <discovered_dataset designation="BC3" ftype="fastqsolexa" file="fastx_barcode_splitter1_BC3.out" /> |
60 <discovered_dataset designation="unmatched" ftype="fastqsolexa" file="fastx_barcode_splitter1_unmatched.out" /> | 61 <discovered_dataset designation="BC4" ftype="fastqsolexa" file="fastx_barcode_splitter1_BC4.out" /> |
61 </output> | 62 <discovered_dataset designation="unmatched" ftype="fastqsolexa" file="fastx_barcode_splitter1_unmatched.out" /> |
62 </test> | 63 </collection> |
63 <test> | 64 </test> |
64 <!-- Split a FASTQ file, using separate index read --> | 65 |
65 <param name="BARCODE" value="fastx_barcode_splitter1.txt" /> | 66 <test> |
66 <param name="input" value="fastx_barcode_splitter1.fastq" ftype="fastqsolexa" /> | 67 <!-- Split a FASTQ file, using separate index read --> |
67 <param name="idxfile" value="fastx_barcode_splitter_index.fastq" ftype="fastqsolexa" /> | 68 <param name="BARCODE" value="fastx_barcode_splitter1.txt" /> |
68 <param name="barcodeLocation" value="idxfile" /> | 69 <param name="input" value="fastx_barcode_splitter1.fastq" ftype="fastqsolexa" /> |
69 <param name="mismatches" value="2" /> | 70 <param name="idxfile" value="fastx_barcode_splitter_index.fastq" ftype="fastqsolexa" /> |
70 <param name="partial" value="0" /> | 71 <param name="barcodeLocation" value="idxfile" /> |
71 <output name="output" file="fastx_barcode_splitter1.out"> | 72 <param name="mismatches" value="2" /> |
72 <discovered_dataset designation="BC1" ftype="fastqsolexa" file="fastx_barcode_splitter1_BC1.out" /> | 73 <param name="partial" value="0" /> |
73 <discovered_dataset designation="BC2" ftype="fastqsolexa" file="fastx_barcode_splitter1_BC2.out" /> | 74 <output name="output" file="fastx_barcode_splitter1.out" /> |
74 <discovered_dataset designation="BC3" ftype="fastqsolexa" file="fastx_barcode_splitter1_BC3.out" /> | 75 <collection name="split_output" type="list"> |
75 <discovered_dataset designation="BC4" ftype="fastqsolexa" file="fastx_barcode_splitter1_BC4.out" /> | 76 <discovered_dataset designation="BC1" ftype="fastqsolexa" file="fastx_barcode_splitter1_BC1.out" /> |
76 <discovered_dataset designation="unmatched" ftype="fastqsolexa" file="fastx_barcode_splitter1_unmatched.out" /> | 77 <discovered_dataset designation="BC2" ftype="fastqsolexa" file="fastx_barcode_splitter1_BC2.out" /> |
77 </output> | 78 <discovered_dataset designation="BC3" ftype="fastqsolexa" file="fastx_barcode_splitter1_BC3.out" /> |
78 </test> | 79 <discovered_dataset designation="BC4" ftype="fastqsolexa" file="fastx_barcode_splitter1_BC4.out" /> |
79 </tests> | 80 <discovered_dataset designation="unmatched" ftype="fastqsolexa" file="fastx_barcode_splitter1_unmatched.out" /> |
81 </collection> | |
82 </test> | |
83 </tests> | |
80 | 84 |
81 <help><![CDATA[ | 85 <help><![CDATA[ |
82 **What it does** | 86 **What it does** |
83 | 87 |
84 This tool splits a FASTQ or FASTA file into several files, using barcodes as the split criteria. | 88 This tool splits a FASTQ or FASTA file into several files, using barcodes as the split criteria. |
90 Barcode files are simple text files. | 94 Barcode files are simple text files. |
91 Each line should contain an identifier (descriptive name for the barcode), and the barcode itself (A/C/G/T), separated by a TAB character. | 95 Each line should contain an identifier (descriptive name for the barcode), and the barcode itself (A/C/G/T), separated by a TAB character. |
92 Example:: | 96 Example:: |
93 | 97 |
94 #This line is a comment (starts with a 'number' sign) | 98 #This line is a comment (starts with a 'number' sign) |
95 BC1 GATCT | 99 BC1 GATCT |
96 BC2 ATCGT | 100 BC2 ATCGT |
97 BC3 GTGAT | 101 BC3 GTGAT |
98 BC4 TGTCT | 102 BC4 TGTCT |
99 | 103 |
100 For each barcode, a new FASTQ file will be created (with the barcode's identifier as part of the file name). | 104 For each barcode, a new FASTQ file will be created (with the barcode's identifier as part of the file name). |
101 Sequences matching the barcode will be stored in the appropriate file. | 105 Sequences matching the barcode will be stored in the appropriate file. |
102 | 106 |
103 One additional FASTQ file will be created (the 'unmatched' file), where sequences not matching any barcode will be stored. | 107 One additional FASTQ file will be created (the 'unmatched' file), where sequences not matching any barcode will be stored. |
104 | 108 |
105 The output of this tool is an HTML file, displaying the split counts and the file names. | 109 The output of this tool is a summary tabel displaying the split counts for each barcode identifier. |
106 In addition, each fastq file produced will be loaded into the galaxy history automatically. | 110 In addition, each fastq file produced will be loaded into the galaxy history as part of a collection list. |
107 ]]> | 111 ]]> |
108 </help> | 112 </help> |
109 | 113 |
110 <!-- FASTX-barcode-splitter is part of the FASTX-toolkit, by A.Gordon (gordon@cshl.edu) --> | 114 <!-- FASTX-barcode-splitter is part of the FASTX-toolkit, by A.Gordon (gordon@cshl.edu) --> |
111 <citations> | 115 <citations> |
112 <citation type="bibtex"> | 116 <citation type="bibtex"> |
113 @misc{gordon_fastx-toolkit_????, | 117 @misc{gordon_fastx-toolkit_????, |
114 title = {{FASTX}-{Toolkit}}, | 118 title = {{FASTX}-{Toolkit}}, |
115 url = {http://hannonlab.cshl.edu/fastx_toolkit/index.html}, | 119 url = {http://hannonlab.cshl.edu/fastx_toolkit/index.html}, |
116 author = {Gordon, Assaf} | 120 author = {Gordon, Assaf} |
117 } | 121 } |
118 </citation> | 122 </citation> |
119 </citations> | 123 </citations> |
120 | 124 |
121 </tool> | 125 </tool> |