annotate umi-tools_counts.xml @ 3:b557acca0b56 draft

planemo upload commit a7a086ce7d7d84f53d4a022fa1da25ef7b9a5b9a
author iuc
date Fri, 20 Jul 2018 03:50:03 -0400
parents 3c932ad4a174
children 70cb5527defb
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
3
b557acca0b56 planemo upload commit a7a086ce7d7d84f53d4a022fa1da25ef7b9a5b9a
iuc
parents: 1
diff changeset
1 <tool id="umi_tools_count" name="UMI-tools count" version="@VERSION@.2">
1
3c932ad4a174 planemo upload commit 9a3aeb2c588f9f67824ea5568923ce70b048499a
iuc
parents: 0
diff changeset
2 <description>performs quantification of UMIs from BAM files</description>
0
8db56d2f8b72 planemo upload commit c79a5f4a05156bb2a6035a844aa9ad8f0e59ecb5
iuc
parents:
diff changeset
3 <macros>
8db56d2f8b72 planemo upload commit c79a5f4a05156bb2a6035a844aa9ad8f0e59ecb5
iuc
parents:
diff changeset
4 <import>macros.xml</import>
8db56d2f8b72 planemo upload commit c79a5f4a05156bb2a6035a844aa9ad8f0e59ecb5
iuc
parents:
diff changeset
5 <xml name="sanitize_tag" >
8db56d2f8b72 planemo upload commit c79a5f4a05156bb2a6035a844aa9ad8f0e59ecb5
iuc
parents:
diff changeset
6 <sanitizer invalid_char="">
8db56d2f8b72 planemo upload commit c79a5f4a05156bb2a6035a844aa9ad8f0e59ecb5
iuc
parents:
diff changeset
7 <valid initial="string.letters,string.digits" />
8db56d2f8b72 planemo upload commit c79a5f4a05156bb2a6035a844aa9ad8f0e59ecb5
iuc
parents:
diff changeset
8 </sanitizer>
8db56d2f8b72 planemo upload commit c79a5f4a05156bb2a6035a844aa9ad8f0e59ecb5
iuc
parents:
diff changeset
9 </xml>
8db56d2f8b72 planemo upload commit c79a5f4a05156bb2a6035a844aa9ad8f0e59ecb5
iuc
parents:
diff changeset
10 </macros>
8db56d2f8b72 planemo upload commit c79a5f4a05156bb2a6035a844aa9ad8f0e59ecb5
iuc
parents:
diff changeset
11 <expand macro="requirements" />
8db56d2f8b72 planemo upload commit c79a5f4a05156bb2a6035a844aa9ad8f0e59ecb5
iuc
parents:
diff changeset
12 <command detect_errors="exit_code"><![CDATA[
3
b557acca0b56 planemo upload commit a7a086ce7d7d84f53d4a022fa1da25ef7b9a5b9a
iuc
parents: 1
diff changeset
13 #import re
b557acca0b56 planemo upload commit a7a086ce7d7d84f53d4a022fa1da25ef7b9a5b9a
iuc
parents: 1
diff changeset
14
b557acca0b56 planemo upload commit a7a086ce7d7d84f53d4a022fa1da25ef7b9a5b9a
iuc
parents: 1
diff changeset
15 ln -s '${input_bam}' 'input.bam' &&
b557acca0b56 planemo upload commit a7a086ce7d7d84f53d4a022fa1da25ef7b9a5b9a
iuc
parents: 1
diff changeset
16 ln -s '${input_bam.metadata.bam_index}' 'input.bam.bai' &&
1
3c932ad4a174 planemo upload commit 9a3aeb2c588f9f67824ea5568923ce70b048499a
iuc
parents: 0
diff changeset
17
3
b557acca0b56 planemo upload commit a7a086ce7d7d84f53d4a022fa1da25ef7b9a5b9a
iuc
parents: 1
diff changeset
18 umi_tools count
b557acca0b56 planemo upload commit a7a086ce7d7d84f53d4a022fa1da25ef7b9a5b9a
iuc
parents: 1
diff changeset
19 -I input.bam
b557acca0b56 planemo upload commit a7a086ce7d7d84f53d4a022fa1da25ef7b9a5b9a
iuc
parents: 1
diff changeset
## Boolean flag left unquoted: its falsevalue is empty, and quoting would pass '' as an argument.
20 $paired
b557acca0b56 planemo upload commit a7a086ce7d7d84f53d4a022fa1da25ef7b9a5b9a
iuc
parents: 1
diff changeset
21 --extract-umi-method='$barcodes.extract_umi_method.value'
b557acca0b56 planemo upload commit a7a086ce7d7d84f53d4a022fa1da25ef7b9a5b9a
iuc
parents: 1
diff changeset
22 #if str($barcodes.extract_umi_method) == 'read_id':
b557acca0b56 planemo upload commit a7a086ce7d7d84f53d4a022fa1da25ef7b9a5b9a
iuc
parents: 1
diff changeset
23 --umi-separator='$barcodes.umi_separator.value'
b557acca0b56 planemo upload commit a7a086ce7d7d84f53d4a022fa1da25ef7b9a5b9a
iuc
parents: 1
diff changeset
24 #else if str($barcodes.extract_umi_method) == 'tag':
b557acca0b56 planemo upload commit a7a086ce7d7d84f53d4a022fa1da25ef7b9a5b9a
iuc
parents: 1
diff changeset
25 --umi-tag='$barcodes.umi_tag.value'
b557acca0b56 planemo upload commit a7a086ce7d7d84f53d4a022fa1da25ef7b9a5b9a
iuc
parents: 1
diff changeset
26 --cell-tag='$barcodes.cell_tag.value'
b557acca0b56 planemo upload commit a7a086ce7d7d84f53d4a022fa1da25ef7b9a5b9a
iuc
parents: 1
diff changeset
27 #end if
b557acca0b56 planemo upload commit a7a086ce7d7d84f53d4a022fa1da25ef7b9a5b9a
iuc
parents: 1
diff changeset
28 --method='$method.value'
b557acca0b56 planemo upload commit a7a086ce7d7d84f53d4a022fa1da25ef7b9a5b9a
iuc
parents: 1
diff changeset
29 --edit-distance-threshold='$edit_distance_threshold'
b557acca0b56 planemo upload commit a7a086ce7d7d84f53d4a022fa1da25ef7b9a5b9a
iuc
parents: 1
diff changeset
30 --mapping-quality='$advanced.mapping_quality'
b557acca0b56 planemo upload commit a7a086ce7d7d84f53d4a022fa1da25ef7b9a5b9a
iuc
parents: 1
diff changeset
31 --per-gene
b557acca0b56 planemo upload commit a7a086ce7d7d84f53d4a022fa1da25ef7b9a5b9a
iuc
parents: 1
diff changeset
## Boolean flags left unquoted: each falsevalue is empty, and quoting would pass '' as an argument.
32 $wide_format_cell_counts
b557acca0b56 planemo upload commit a7a086ce7d7d84f53d4a022fa1da25ef7b9a5b9a
iuc
parents: 1
diff changeset
33 $advanced.per_contig
b557acca0b56 planemo upload commit a7a086ce7d7d84f53d4a022fa1da25ef7b9a5b9a
iuc
parents: 1
diff changeset
34 $advanced.per_cell
b557acca0b56 planemo upload commit a7a086ce7d7d84f53d4a022fa1da25ef7b9a5b9a
iuc
parents: 1
diff changeset
35
b557acca0b56 planemo upload commit a7a086ce7d7d84f53d4a022fa1da25ef7b9a5b9a
iuc
parents: 1
diff changeset
36 #if str($advanced.gene_tag) != "":
b557acca0b56 planemo upload commit a7a086ce7d7d84f53d4a022fa1da25ef7b9a5b9a
iuc
parents: 1
diff changeset
37 --gene-tag='$advanced.gene_tag.value'
b557acca0b56 planemo upload commit a7a086ce7d7d84f53d4a022fa1da25ef7b9a5b9a
iuc
parents: 1
diff changeset
38 #end if
b557acca0b56 planemo upload commit a7a086ce7d7d84f53d4a022fa1da25ef7b9a5b9a
iuc
parents: 1
diff changeset
39 #if str($advanced.skip_tags_regex) != "":
b557acca0b56 planemo upload commit a7a086ce7d7d84f53d4a022fa1da25ef7b9a5b9a
iuc
parents: 1
diff changeset
40 --skip-tags-regex='$advanced.skip_tags_regex.value'
b557acca0b56 planemo upload commit a7a086ce7d7d84f53d4a022fa1da25ef7b9a5b9a
iuc
parents: 1
diff changeset
41 #end if
b557acca0b56 planemo upload commit a7a086ce7d7d84f53d4a022fa1da25ef7b9a5b9a
iuc
parents: 1
diff changeset
## Compare numerically: a quoted '$...' literal is a string and is never equal to the integer 0.
42 #if int($advanced.random_seed) != 0:
b557acca0b56 planemo upload commit a7a086ce7d7d84f53d4a022fa1da25ef7b9a5b9a
iuc
parents: 1
diff changeset
43 --random-seed='$advanced.random_seed'
b557acca0b56 planemo upload commit a7a086ce7d7d84f53d4a022fa1da25ef7b9a5b9a
iuc
parents: 1
diff changeset
44 #end if
b557acca0b56 planemo upload commit a7a086ce7d7d84f53d4a022fa1da25ef7b9a5b9a
iuc
parents: 1
diff changeset
45 -S '$out_counts'
b557acca0b56 planemo upload commit a7a086ce7d7d84f53d4a022fa1da25ef7b9a5b9a
iuc
parents: 1
diff changeset
46
b557acca0b56 planemo upload commit a7a086ce7d7d84f53d4a022fa1da25ef7b9a5b9a
iuc
parents: 1
diff changeset
47
b557acca0b56 planemo upload commit a7a086ce7d7d84f53d4a022fa1da25ef7b9a5b9a
iuc
parents: 1
diff changeset
48 #if str($cond_extra.prepender) != "none":
b557acca0b56 planemo upload commit a7a086ce7d7d84f53d4a022fa1da25ef7b9a5b9a
iuc
parents: 1
diff changeset
49 #set $replacer = re.sub('[^\w\_]+', '_', str($input_bam.element_identifier.rsplit('.',1)[0]))
b557acca0b56 planemo upload commit a7a086ce7d7d84f53d4a022fa1da25ef7b9a5b9a
iuc
parents: 1
diff changeset
50 #if str($cond_extra.prepender) == "string":
b557acca0b56 planemo upload commit a7a086ce7d7d84f53d4a022fa1da25ef7b9a5b9a
iuc
parents: 1
diff changeset
51 #set $replacer = str($cond_extra.custom_label)
b557acca0b56 planemo upload commit a7a086ce7d7d84f53d4a022fa1da25ef7b9a5b9a
iuc
parents: 1
diff changeset
52 #end if
b557acca0b56 planemo upload commit a7a086ce7d7d84f53d4a022fa1da25ef7b9a5b9a
iuc
parents: 1
diff changeset
53
b557acca0b56 planemo upload commit a7a086ce7d7d84f53d4a022fa1da25ef7b9a5b9a
iuc
parents: 1
diff changeset
54 && sed -i -r '1s|\b([ACGT]+)\b|'"$replacer"'_\1|g' '$out_counts'
b557acca0b56 planemo upload commit a7a086ce7d7d84f53d4a022fa1da25ef7b9a5b9a
iuc
parents: 1
diff changeset
55 #end if
b557acca0b56 planemo upload commit a7a086ce7d7d84f53d4a022fa1da25ef7b9a5b9a
iuc
parents: 1
diff changeset
56
0
8db56d2f8b72 planemo upload commit c79a5f4a05156bb2a6035a844aa9ad8f0e59ecb5
iuc
parents:
diff changeset
57 ]]></command>
8db56d2f8b72 planemo upload commit c79a5f4a05156bb2a6035a844aa9ad8f0e59ecb5
iuc
parents:
diff changeset
58 <inputs>
8db56d2f8b72 planemo upload commit c79a5f4a05156bb2a6035a844aa9ad8f0e59ecb5
iuc
parents:
diff changeset
59 <param name="input_bam" type="data" format="bam" label="Sorted BAM file" help="Please use the samtools sort tool to ensure a correct BAM input" />
1
3c932ad4a174 planemo upload commit 9a3aeb2c588f9f67824ea5568923ce70b048499a
iuc
parents: 0
diff changeset
60 <param argument="--paired" type="boolean" truevalue="--paired" falsevalue="" checked="false" label="Bam is paired-end" help="both read pairs will be output. This will also force the use of the template length to determine reads with the same mapping coordinates." />
0
8db56d2f8b72 planemo upload commit c79a5f4a05156bb2a6035a844aa9ad8f0e59ecb5
iuc
parents:
diff changeset
61 <conditional name="barcodes" >
1
3c932ad4a174 planemo upload commit 9a3aeb2c588f9f67824ea5568923ce70b048499a
iuc
parents: 0
diff changeset
62 <param argument="--extract-umi-method" name="extract_umi_method" type="select" label="Umi Extract Method" help="How are the barcodes encoded in the read?" >
0
8db56d2f8b72 planemo upload commit c79a5f4a05156bb2a6035a844aa9ad8f0e59ecb5
iuc
parents:
diff changeset
63 <option value="read_id" selected="true">Barcodes are contained at the end of the read separated by a delimiter</option>
8db56d2f8b72 planemo upload commit c79a5f4a05156bb2a6035a844aa9ad8f0e59ecb5
iuc
parents:
diff changeset
64 <option value="tag" >Barcodes are contained in tags</option>
8db56d2f8b72 planemo upload commit c79a5f4a05156bb2a6035a844aa9ad8f0e59ecb5
iuc
parents:
diff changeset
65 <option value="umis" >Barcodes were extracted using umis</option>
8db56d2f8b72 planemo upload commit c79a5f4a05156bb2a6035a844aa9ad8f0e59ecb5
iuc
parents:
diff changeset
66 </param>
8db56d2f8b72 planemo upload commit c79a5f4a05156bb2a6035a844aa9ad8f0e59ecb5
iuc
parents:
diff changeset
67 <when value="read_id" >
1
3c932ad4a174 planemo upload commit 9a3aeb2c588f9f67824ea5568923ce70b048499a
iuc
parents: 0
diff changeset
68 <param argument="--umi-separator" name="umi_separator" type="text" label="Delimiter between read id and the UMI" value="_" >
3c932ad4a174 planemo upload commit 9a3aeb2c588f9f67824ea5568923ce70b048499a
iuc
parents: 0
diff changeset
69 <sanitizer invalid_char="" >
3c932ad4a174 planemo upload commit 9a3aeb2c588f9f67824ea5568923ce70b048499a
iuc
parents: 0
diff changeset
70 <valid initial="string.punctuation" />
3c932ad4a174 planemo upload commit 9a3aeb2c588f9f67824ea5568923ce70b048499a
iuc
parents: 0
diff changeset
71 </sanitizer>
0
8db56d2f8b72 planemo upload commit c79a5f4a05156bb2a6035a844aa9ad8f0e59ecb5
iuc
parents:
diff changeset
72 </param>
8db56d2f8b72 planemo upload commit c79a5f4a05156bb2a6035a844aa9ad8f0e59ecb5
iuc
parents:
diff changeset
73 </when>
8db56d2f8b72 planemo upload commit c79a5f4a05156bb2a6035a844aa9ad8f0e59ecb5
iuc
parents:
diff changeset
74 <when value="tag" >
1
3c932ad4a174 planemo upload commit 9a3aeb2c588f9f67824ea5568923ce70b048499a
iuc
parents: 0
diff changeset
75 <param argument="--umi-tag" name="umi_tag" type="text" label="Tag which contains the UMI" >
0
8db56d2f8b72 planemo upload commit c79a5f4a05156bb2a6035a844aa9ad8f0e59ecb5
iuc
parents:
diff changeset
76 <expand macro="sanitize_tag" />
8db56d2f8b72 planemo upload commit c79a5f4a05156bb2a6035a844aa9ad8f0e59ecb5
iuc
parents:
diff changeset
77 </param>
1
3c932ad4a174 planemo upload commit 9a3aeb2c588f9f67824ea5568923ce70b048499a
iuc
parents: 0
diff changeset
78 <param argument="--cell-tag" name="cell_tag" type="text" label="Tag which contains the cell barcode" >
0
8db56d2f8b72 planemo upload commit c79a5f4a05156bb2a6035a844aa9ad8f0e59ecb5
iuc
parents:
diff changeset
79 <expand macro="sanitize_tag" />
8db56d2f8b72 planemo upload commit c79a5f4a05156bb2a6035a844aa9ad8f0e59ecb5
iuc
parents:
diff changeset
80 </param>
8db56d2f8b72 planemo upload commit c79a5f4a05156bb2a6035a844aa9ad8f0e59ecb5
iuc
parents:
diff changeset
81 </when>
8db56d2f8b72 planemo upload commit c79a5f4a05156bb2a6035a844aa9ad8f0e59ecb5
iuc
parents:
diff changeset
82 <when value="umis"></when>
8db56d2f8b72 planemo upload commit c79a5f4a05156bb2a6035a844aa9ad8f0e59ecb5
iuc
parents:
diff changeset
83 </conditional>
1
3c932ad4a174 planemo upload commit 9a3aeb2c588f9f67824ea5568923ce70b048499a
iuc
parents: 0
diff changeset
84 <param argument="--method" type="select" label="Method to identify group of reads" help="UMIs with the same (or similar) codes can be grouped together. The simplest methods 'unique' and 'percentile' group identical
3c932ad4a174 planemo upload commit 9a3aeb2c588f9f67824ea5568923ce70b048499a
iuc
parents: 0
diff changeset
85 UMIs, however 'cluster', 'adjacency', and 'directional' can group similar umis with edit distances less than some threshold. Unique: Reads group share the exact same UMI. Percentile: Reads group share the same UMI, and UMIs with
3c932ad4a174 planemo upload commit 9a3aeb2c588f9f67824ea5568923ce70b048499a
iuc
parents: 0
diff changeset
86 counts &lt; 1% of the median counts for UMIs at the same position are ignored. Cluster: Identify clusters of connected UMIs (based on hamming distance threshold). Adjacency: Same as cluster, but considers only directly adjacent UMIs in the cluster. Directional: Identify cluster of connected UMIs based on hamming distance and umi." >
0
8db56d2f8b72 planemo upload commit c79a5f4a05156bb2a6035a844aa9ad8f0e59ecb5
iuc
parents:
diff changeset
87 <option value="unique" >Unique</option>
8db56d2f8b72 planemo upload commit c79a5f4a05156bb2a6035a844aa9ad8f0e59ecb5
iuc
parents:
diff changeset
88 <option value="percentile">Percentile</option>
8db56d2f8b72 planemo upload commit c79a5f4a05156bb2a6035a844aa9ad8f0e59ecb5
iuc
parents:
diff changeset
89 <option value="cluster">Cluster</option>
8db56d2f8b72 planemo upload commit c79a5f4a05156bb2a6035a844aa9ad8f0e59ecb5
iuc
parents:
diff changeset
90 <option value="adjacency">Adjacency</option>
8db56d2f8b72 planemo upload commit c79a5f4a05156bb2a6035a844aa9ad8f0e59ecb5
iuc
parents:
diff changeset
91 <option value="directional" selected="true" >Directional</option>
8db56d2f8b72 planemo upload commit c79a5f4a05156bb2a6035a844aa9ad8f0e59ecb5
iuc
parents:
diff changeset
92 </param>
1
3c932ad4a174 planemo upload commit 9a3aeb2c588f9f67824ea5568923ce70b048499a
iuc
parents: 0
diff changeset
93 <param argument="--edit-distance-threshold" name="edit_distance_threshold" type="integer" label="Edit distance threshold" min="0" value="1" />
3c932ad4a174 planemo upload commit 9a3aeb2c588f9f67824ea5568923ce70b048499a
iuc
parents: 0
diff changeset
94 <param argument="--wide-format-cell-counts" name="wide_format_cell_counts" type="boolean" truevalue="--wide-format-cell-counts" falsevalue="" checked="true" label="Output a matrix of genes and cells, instead of a flat file" />
0
8db56d2f8b72 planemo upload commit c79a5f4a05156bb2a6035a844aa9ad8f0e59ecb5
iuc
parents:
diff changeset
95 <section name="advanced" title="Extra parameters" >
1
3c932ad4a174 planemo upload commit 9a3aeb2c588f9f67824ea5568923ce70b048499a
iuc
parents: 0
diff changeset
96 <param argument="--mapping-quality" name="mapping_quality" type="integer" min="0" value="0" label="Minimum mapping quality" />
0
8db56d2f8b72 planemo upload commit c79a5f4a05156bb2a6035a844aa9ad8f0e59ecb5
iuc
parents:
diff changeset
97 <!-- Currently hard-coded parameter. Leave here if useful to future wrapper -->
1
3c932ad4a174 planemo upload commit 9a3aeb2c588f9f67824ea5568923ce70b048499a
iuc
parents: 0
diff changeset
98 <!-- <param argument="-\-per-gene" name="per_gene" type="text" label="Group reads together if they have the same gene" help="Reads will be grouped together if they have the same gene. This is useful if your library
3c932ad4a174 planemo upload commit 9a3aeb2c588f9f67824ea5568923ce70b048499a
iuc
parents: 0
diff changeset
99 prep generates PCR duplicates with non-identical alignment positions such as CEL-Seq. Note this option is hardcoded to be on with the count command. I.e counting is always performed per-gene. Must be combined with either
0
8db56d2f8b72 planemo upload commit c79a5f4a05156bb2a6035a844aa9ad8f0e59ecb5
iuc
parents:
diff changeset
100 -\-gene-tag or -\-per-contig option" /> -->
3
b557acca0b56 planemo upload commit a7a086ce7d7d84f53d4a022fa1da25ef7b9a5b9a
iuc
parents: 1
diff changeset
101 <param argument="--gene-tag" name="gene_tag" type="text" label="Deduplicate per gene." value="XT" help="The gene information is encoded in the bam read tag." >
0
8db56d2f8b72 planemo upload commit c79a5f4a05156bb2a6035a844aa9ad8f0e59ecb5
iuc
parents:
diff changeset
102 <expand macro="sanitize_tag" />
8db56d2f8b72 planemo upload commit c79a5f4a05156bb2a6035a844aa9ad8f0e59ecb5
iuc
parents:
diff changeset
103 </param>
1
3c932ad4a174 planemo upload commit 9a3aeb2c588f9f67824ea5568923ce70b048499a
iuc
parents: 0
diff changeset
104 <param argument="--skip-tags-regex" name="skip_tags_regex" type="text" label="Skip any reads where the gene matches this tag" value="" >
0
8db56d2f8b72 planemo upload commit c79a5f4a05156bb2a6035a844aa9ad8f0e59ecb5
iuc
parents:
diff changeset
105 <sanitizer invalid_char="">
8db56d2f8b72 planemo upload commit c79a5f4a05156bb2a6035a844aa9ad8f0e59ecb5
iuc
parents:
diff changeset
106 <valid initial="string.letters,string.digits">
8db56d2f8b72 planemo upload commit c79a5f4a05156bb2a6035a844aa9ad8f0e59ecb5
iuc
parents:
diff changeset
107 <add value="!="/>
8db56d2f8b72 planemo upload commit c79a5f4a05156bb2a6035a844aa9ad8f0e59ecb5
iuc
parents:
diff changeset
108 <add value="-"/>
8db56d2f8b72 planemo upload commit c79a5f4a05156bb2a6035a844aa9ad8f0e59ecb5
iuc
parents:
diff changeset
109 <add value="_"/>
8db56d2f8b72 planemo upload commit c79a5f4a05156bb2a6035a844aa9ad8f0e59ecb5
iuc
parents:
diff changeset
110 <add value="."/>
8db56d2f8b72 planemo upload commit c79a5f4a05156bb2a6035a844aa9ad8f0e59ecb5
iuc
parents:
diff changeset
111 <add value="?"/>
8db56d2f8b72 planemo upload commit c79a5f4a05156bb2a6035a844aa9ad8f0e59ecb5
iuc
parents:
diff changeset
112 <add value="&lt;"/><!-- left triangle bracket -->
8db56d2f8b72 planemo upload commit c79a5f4a05156bb2a6035a844aa9ad8f0e59ecb5
iuc
parents:
diff changeset
113 <add value="&gt;"/><!-- right triangle bracket -->
8db56d2f8b72 planemo upload commit c79a5f4a05156bb2a6035a844aa9ad8f0e59ecb5
iuc
parents:
diff changeset
114 <add value="&#91;"/> <!-- left square bracket -->
8db56d2f8b72 planemo upload commit c79a5f4a05156bb2a6035a844aa9ad8f0e59ecb5
iuc
parents:
diff changeset
115 <add value="&#93;"/> <!-- right square bracket -->
8db56d2f8b72 planemo upload commit c79a5f4a05156bb2a6035a844aa9ad8f0e59ecb5
iuc
parents:
diff changeset
116 <add value="&#94;"/> <!-- caret -->
8db56d2f8b72 planemo upload commit c79a5f4a05156bb2a6035a844aa9ad8f0e59ecb5
iuc
parents:
diff changeset
117 <add value="&#123;"/> <!-- left curly -->
8db56d2f8b72 planemo upload commit c79a5f4a05156bb2a6035a844aa9ad8f0e59ecb5
iuc
parents:
diff changeset
118 <add value="&#125;"/> <!-- right curly -->
8db56d2f8b72 planemo upload commit c79a5f4a05156bb2a6035a844aa9ad8f0e59ecb5
iuc
parents:
diff changeset
119 <add value="&#40;"/> <!-- left parenthesis -->
8db56d2f8b72 planemo upload commit c79a5f4a05156bb2a6035a844aa9ad8f0e59ecb5
iuc
parents:
diff changeset
120 <add value="&#41;"/> <!-- right parenthesis -->
8db56d2f8b72 planemo upload commit c79a5f4a05156bb2a6035a844aa9ad8f0e59ecb5
iuc
parents:
diff changeset
121 </valid>
8db56d2f8b72 planemo upload commit c79a5f4a05156bb2a6035a844aa9ad8f0e59ecb5
iuc
parents:
diff changeset
122 </sanitizer>
8db56d2f8b72 planemo upload commit c79a5f4a05156bb2a6035a844aa9ad8f0e59ecb5
iuc
parents:
diff changeset
123 </param>
1
3c932ad4a174 planemo upload commit 9a3aeb2c588f9f67824ea5568923ce70b048499a
iuc
parents: 0
diff changeset
124 <param argument="--per-contig" name="per_contig" type="boolean" truevalue="--per-contig" falsevalue="" checked="false" label="Deduplicate per contig (field 3 in BAM; RNAME)" help="All reads with the same contig will be considered to have the same alignment position. This is useful if you have aligned to a reference transcriptome with one transcript per gene." />
3c932ad4a174 planemo upload commit 9a3aeb2c588f9f67824ea5568923ce70b048499a
iuc
parents: 0
diff changeset
125 <param argument="--per-cell" name="per_cell" type="boolean" truevalue="--per-cell" falsevalue="" checked="true" label="Group reads only if they have the same cell barcode." />
3c932ad4a174 planemo upload commit 9a3aeb2c588f9f67824ea5568923ce70b048499a
iuc
parents: 0
diff changeset
126 <param argument="--random-seed" name="random_seed" type="integer" min="0" value="0" label="Random Seed" />
3c932ad4a174 planemo upload commit 9a3aeb2c588f9f67824ea5568923ce70b048499a
iuc
parents: 0
diff changeset
127 </section>
3
b557acca0b56 planemo upload commit a7a086ce7d7d84f53d4a022fa1da25ef7b9a5b9a
iuc
parents: 1
diff changeset
128 <conditional name="cond_extra" >
b557acca0b56 planemo upload commit a7a086ce7d7d84f53d4a022fa1da25ef7b9a5b9a
iuc
parents: 1
diff changeset
129 <param name="prepender" type="select" label="Prepend a label to all column headers" help="This preserves uniqueness when merging with other files with the same headers. Note: filename must not contain a '.' character" >
b557acca0b56 planemo upload commit a7a086ce7d7d84f53d4a022fa1da25ef7b9a5b9a
iuc
parents: 1
diff changeset
130 <option value="none" selected="true" >No modifications</option>
b557acca0b56 planemo upload commit a7a086ce7d7d84f53d4a022fa1da25ef7b9a5b9a
iuc
parents: 1
diff changeset
131 <option value="string">Custom Label</option>
b557acca0b56 planemo upload commit a7a086ce7d7d84f53d4a022fa1da25ef7b9a5b9a
iuc
parents: 1
diff changeset
132 <option value="dataset name">Dataset Name</option>
b557acca0b56 planemo upload commit a7a086ce7d7d84f53d4a022fa1da25ef7b9a5b9a
iuc
parents: 1
diff changeset
133 </param>
b557acca0b56 planemo upload commit a7a086ce7d7d84f53d4a022fa1da25ef7b9a5b9a
iuc
parents: 1
diff changeset
134 <when value="none"></when>
b557acca0b56 planemo upload commit a7a086ce7d7d84f53d4a022fa1da25ef7b9a5b9a
iuc
parents: 1
diff changeset
135 <when value="dataset name"></when>
b557acca0b56 planemo upload commit a7a086ce7d7d84f53d4a022fa1da25ef7b9a5b9a
iuc
parents: 1
diff changeset
136 <when value="string">
b557acca0b56 planemo upload commit a7a086ce7d7d84f53d4a022fa1da25ef7b9a5b9a
iuc
parents: 1
diff changeset
137 <param name="custom_label" type="text" label="Label to Prepend" >
b557acca0b56 planemo upload commit a7a086ce7d7d84f53d4a022fa1da25ef7b9a5b9a
iuc
parents: 1
diff changeset
138 <sanitizer invalid_char="">
b557acca0b56 planemo upload commit a7a086ce7d7d84f53d4a022fa1da25ef7b9a5b9a
iuc
parents: 1
diff changeset
139 <valid initial="string.letters,string.digits">
b557acca0b56 planemo upload commit a7a086ce7d7d84f53d4a022fa1da25ef7b9a5b9a
iuc
parents: 1
diff changeset
140 <add value="-"/>
b557acca0b56 planemo upload commit a7a086ce7d7d84f53d4a022fa1da25ef7b9a5b9a
iuc
parents: 1
diff changeset
141 <add value="_"/>
b557acca0b56 planemo upload commit a7a086ce7d7d84f53d4a022fa1da25ef7b9a5b9a
iuc
parents: 1
diff changeset
142 <add value="."/>
b557acca0b56 planemo upload commit a7a086ce7d7d84f53d4a022fa1da25ef7b9a5b9a
iuc
parents: 1
diff changeset
143 </valid>
b557acca0b56 planemo upload commit a7a086ce7d7d84f53d4a022fa1da25ef7b9a5b9a
iuc
parents: 1
diff changeset
144 </sanitizer>
b557acca0b56 planemo upload commit a7a086ce7d7d84f53d4a022fa1da25ef7b9a5b9a
iuc
parents: 1
diff changeset
145 </param>
b557acca0b56 planemo upload commit a7a086ce7d7d84f53d4a022fa1da25ef7b9a5b9a
iuc
parents: 1
diff changeset
146 </when>
b557acca0b56 planemo upload commit a7a086ce7d7d84f53d4a022fa1da25ef7b9a5b9a
iuc
parents: 1
diff changeset
147 </conditional>
0
8db56d2f8b72 planemo upload commit c79a5f4a05156bb2a6035a844aa9ad8f0e59ecb5
iuc
parents:
diff changeset
148 </inputs>
8db56d2f8b72 planemo upload commit c79a5f4a05156bb2a6035a844aa9ad8f0e59ecb5
iuc
parents:
diff changeset
149 <outputs>
1
3c932ad4a174 planemo upload commit 9a3aeb2c588f9f67824ea5568923ce70b048499a
iuc
parents: 0
diff changeset
150 <data name="out_counts" format="tabular" />
0
8db56d2f8b72 planemo upload commit c79a5f4a05156bb2a6035a844aa9ad8f0e59ecb5
iuc
parents:
diff changeset
151 </outputs>
8db56d2f8b72 planemo upload commit c79a5f4a05156bb2a6035a844aa9ad8f0e59ecb5
iuc
parents:
diff changeset
152 <tests>
8db56d2f8b72 planemo upload commit c79a5f4a05156bb2a6035a844aa9ad8f0e59ecb5
iuc
parents:
diff changeset
153 <test><!--count_single_gene_tag:-->
8db56d2f8b72 planemo upload commit c79a5f4a05156bb2a6035a844aa9ad8f0e59ecb5
iuc
parents:
diff changeset
154 <param name="input_bam" value="chr19_gene_tags.bam" />
8db56d2f8b72 planemo upload commit c79a5f4a05156bb2a6035a844aa9ad8f0e59ecb5
iuc
parents:
diff changeset
155 <param name="random_seed" value="123456789" />
1
3c932ad4a174 planemo upload commit 9a3aeb2c588f9f67824ea5568923ce70b048499a
iuc
parents: 0
diff changeset
156 <param name="method" value="directional" />
0
8db56d2f8b72 planemo upload commit c79a5f4a05156bb2a6035a844aa9ad8f0e59ecb5
iuc
parents:
diff changeset
157 <param name="gene_tag" value="XF" />
8db56d2f8b72 planemo upload commit c79a5f4a05156bb2a6035a844aa9ad8f0e59ecb5
iuc
parents:
diff changeset
158 <param name="skip_tags_regex" value="^[__|Unassigned]" />
8db56d2f8b72 planemo upload commit c79a5f4a05156bb2a6035a844aa9ad8f0e59ecb5
iuc
parents:
diff changeset
159 <param name="extract_umi_method" value="umis" />
1
3c932ad4a174 planemo upload commit 9a3aeb2c588f9f67824ea5568923ce70b048499a
iuc
parents: 0
diff changeset
160 <param name="wide_format_cell_counts" value="false" />
3c932ad4a174 planemo upload commit 9a3aeb2c588f9f67824ea5568923ce70b048499a
iuc
parents: 0
diff changeset
161 <param name="per_cell" value="false" />
0
8db56d2f8b72 planemo upload commit c79a5f4a05156bb2a6035a844aa9ad8f0e59ecb5
iuc
parents:
diff changeset
162 <output name="out_counts" value="count_single_gene_tag.tsv" />
8db56d2f8b72 planemo upload commit c79a5f4a05156bb2a6035a844aa9ad8f0e59ecb5
iuc
parents:
diff changeset
163 </test>
8db56d2f8b72 planemo upload commit c79a5f4a05156bb2a6035a844aa9ad8f0e59ecb5
iuc
parents:
diff changeset
164 <test><!--count_single_cells_gene_tag:-->
8db56d2f8b72 planemo upload commit c79a5f4a05156bb2a6035a844aa9ad8f0e59ecb5
iuc
parents:
diff changeset
165 <param name="input_bam" value="chr19_gene_tags.bam" />
8db56d2f8b72 planemo upload commit c79a5f4a05156bb2a6035a844aa9ad8f0e59ecb5
iuc
parents:
diff changeset
166 <param name="random_seed" value="123456789" />
1
3c932ad4a174 planemo upload commit 9a3aeb2c588f9f67824ea5568923ce70b048499a
iuc
parents: 0
diff changeset
167 <param name="method" value="directional" />
0
8db56d2f8b72 planemo upload commit c79a5f4a05156bb2a6035a844aa9ad8f0e59ecb5
iuc
parents:
diff changeset
168 <param name="gene_tag" value="XF" />
8db56d2f8b72 planemo upload commit c79a5f4a05156bb2a6035a844aa9ad8f0e59ecb5
iuc
parents:
diff changeset
169 <param name="skip_tags_regex" value="^[__|Unassigned]" />
1
3c932ad4a174 planemo upload commit 9a3aeb2c588f9f67824ea5568923ce70b048499a
iuc
parents: 0
diff changeset
170 <param name="per_cell" value="true" />
0
8db56d2f8b72 planemo upload commit c79a5f4a05156bb2a6035a844aa9ad8f0e59ecb5
iuc
parents:
diff changeset
171 <param name="extract_umi_method" value="umis" />
1
3c932ad4a174 planemo upload commit 9a3aeb2c588f9f67824ea5568923ce70b048499a
iuc
parents: 0
diff changeset
172 <param name="wide_format_cell_counts" value="false" />
0
8db56d2f8b72 planemo upload commit c79a5f4a05156bb2a6035a844aa9ad8f0e59ecb5
iuc
parents:
diff changeset
173 <output name="out_counts" value="count_single_cells_gene_tag.tsv" />
8db56d2f8b72 planemo upload commit c79a5f4a05156bb2a6035a844aa9ad8f0e59ecb5
iuc
parents:
diff changeset
174 </test>
8db56d2f8b72 planemo upload commit c79a5f4a05156bb2a6035a844aa9ad8f0e59ecb5
iuc
parents:
diff changeset
175 <test><!--count_single_cells_wide_gene_tag:-->
8db56d2f8b72 planemo upload commit c79a5f4a05156bb2a6035a844aa9ad8f0e59ecb5
iuc
parents:
diff changeset
176 <param name="input_bam" value="chr19_gene_tags.bam" />
8db56d2f8b72 planemo upload commit c79a5f4a05156bb2a6035a844aa9ad8f0e59ecb5
iuc
parents:
diff changeset
177 <param name="random_seed" value="123456789" />
1
3c932ad4a174 planemo upload commit 9a3aeb2c588f9f67824ea5568923ce70b048499a
iuc
parents: 0
diff changeset
178 <param name="method" value="directional" />
0
8db56d2f8b72 planemo upload commit c79a5f4a05156bb2a6035a844aa9ad8f0e59ecb5
iuc
parents:
diff changeset
179 <param name="gene_tag" value="XF" />
8db56d2f8b72 planemo upload commit c79a5f4a05156bb2a6035a844aa9ad8f0e59ecb5
iuc
parents:
diff changeset
180 <param name="skip_tags_regex" value="^[__|Unassigned]" />
1
3c932ad4a174 planemo upload commit 9a3aeb2c588f9f67824ea5568923ce70b048499a
iuc
parents: 0
diff changeset
181 <param name="per_cell" value="true" />
0
8db56d2f8b72 planemo upload commit c79a5f4a05156bb2a6035a844aa9ad8f0e59ecb5
iuc
parents:
diff changeset
182 <param name="extract_umi_method" value="umis" />
8db56d2f8b72 planemo upload commit c79a5f4a05156bb2a6035a844aa9ad8f0e59ecb5
iuc
parents:
diff changeset
183 <param name="wide_format_cell_counts" value="true" />
8db56d2f8b72 planemo upload commit c79a5f4a05156bb2a6035a844aa9ad8f0e59ecb5
iuc
parents:
diff changeset
184 <output name="out_counts" value="count_single_cells_gene_tag_wide.tsv" />
8db56d2f8b72 planemo upload commit c79a5f4a05156bb2a6035a844aa9ad8f0e59ecb5
iuc
parents:
diff changeset
185 </test>
1
3c932ad4a174 planemo upload commit 9a3aeb2c588f9f67824ea5568923ce70b048499a
iuc
parents: 0
diff changeset
186 <test><!-- count ENSDARG00000019692, with defaults -->
3c932ad4a174 planemo upload commit 9a3aeb2c588f9f67824ea5568923ce70b048499a
iuc
parents: 0
diff changeset
187 <param name="input_bam" value="fc.ENSDARG00000019692.bam" />
3c932ad4a174 planemo upload commit 9a3aeb2c588f9f67824ea5568923ce70b048499a
iuc
parents: 0
diff changeset
188 <param name="method" value="unique" />
3c932ad4a174 planemo upload commit 9a3aeb2c588f9f67824ea5568923ce70b048499a
iuc
parents: 0
diff changeset
189 <output name="out_counts" value="fc.ENSDARG00000019692.counts" />
3c932ad4a174 planemo upload commit 9a3aeb2c588f9f67824ea5568923ce70b048499a
iuc
parents: 0
diff changeset
190 </test>
3
b557acca0b56 planemo upload commit a7a086ce7d7d84f53d4a022fa1da25ef7b9a5b9a
iuc
parents: 1
diff changeset
191 <test><!-- count ENSDARG00000019692, relabel string -->
b557acca0b56 planemo upload commit a7a086ce7d7d84f53d4a022fa1da25ef7b9a5b9a
iuc
parents: 1
diff changeset
192 <param name="input_bam" value="fc.ENSDARG00000019692.bam" />
b557acca0b56 planemo upload commit a7a086ce7d7d84f53d4a022fa1da25ef7b9a5b9a
iuc
parents: 1
diff changeset
193 <param name="method" value="unique" />
b557acca0b56 planemo upload commit a7a086ce7d7d84f53d4a022fa1da25ef7b9a5b9a
iuc
parents: 1
diff changeset
194 <conditional name="cond_extra" >
b557acca0b56 planemo upload commit a7a086ce7d7d84f53d4a022fa1da25ef7b9a5b9a
iuc
parents: 1
diff changeset
195 <param name="prepender" value="string" />
b557acca0b56 planemo upload commit a7a086ce7d7d84f53d4a022fa1da25ef7b9a5b9a
iuc
parents: 1
diff changeset
196 <param name="custom_label" value="test" />
b557acca0b56 planemo upload commit a7a086ce7d7d84f53d4a022fa1da25ef7b9a5b9a
iuc
parents: 1
diff changeset
197 </conditional>
b557acca0b56 planemo upload commit a7a086ce7d7d84f53d4a022fa1da25ef7b9a5b9a
iuc
parents: 1
diff changeset
198 <output name="out_counts" value="fc.ENSDARG00000019692.counts.test" />
b557acca0b56 planemo upload commit a7a086ce7d7d84f53d4a022fa1da25ef7b9a5b9a
iuc
parents: 1
diff changeset
199 </test>
b557acca0b56 planemo upload commit a7a086ce7d7d84f53d4a022fa1da25ef7b9a5b9a
iuc
parents: 1
diff changeset
200 <test><!-- count ENSDARG00000019692, relabel filename -->
b557acca0b56 planemo upload commit a7a086ce7d7d84f53d4a022fa1da25ef7b9a5b9a
iuc
parents: 1
diff changeset
201 <param name="input_bam" value="fc.ENSDARG00000019692.bam" />
b557acca0b56 planemo upload commit a7a086ce7d7d84f53d4a022fa1da25ef7b9a5b9a
iuc
parents: 1
diff changeset
202 <param name="method" value="unique" />
b557acca0b56 planemo upload commit a7a086ce7d7d84f53d4a022fa1da25ef7b9a5b9a
iuc
parents: 1
diff changeset
203 <conditional name="cond_extra" >
b557acca0b56 planemo upload commit a7a086ce7d7d84f53d4a022fa1da25ef7b9a5b9a
iuc
parents: 1
diff changeset
204 <param name="prepender" value="dataset name" />
b557acca0b56 planemo upload commit a7a086ce7d7d84f53d4a022fa1da25ef7b9a5b9a
iuc
parents: 1
diff changeset
205 </conditional>
b557acca0b56 planemo upload commit a7a086ce7d7d84f53d4a022fa1da25ef7b9a5b9a
iuc
parents: 1
diff changeset
206 <output name="out_counts" value="fc.ENSDARG00000019692.counts.name" />
b557acca0b56 planemo upload commit a7a086ce7d7d84f53d4a022fa1da25ef7b9a5b9a
iuc
parents: 1
diff changeset
207 </test>
0
8db56d2f8b72 planemo upload commit c79a5f4a05156bb2a6035a844aa9ad8f0e59ecb5
iuc
parents:
diff changeset
208 </tests>
8db56d2f8b72 planemo upload commit c79a5f4a05156bb2a6035a844aa9ad8f0e59ecb5
iuc
parents:
diff changeset
209 <help><![CDATA[
8db56d2f8b72 planemo upload commit c79a5f4a05156bb2a6035a844aa9ad8f0e59ecb5
iuc
parents:
diff changeset
210
8db56d2f8b72 planemo upload commit c79a5f4a05156bb2a6035a844aa9ad8f0e59ecb5
iuc
parents:
diff changeset
211 UMI Tools count - Count reads per gene from BAM using UMIs
8db56d2f8b72 planemo upload commit c79a5f4a05156bb2a6035a844aa9ad8f0e59ecb5
iuc
parents:
diff changeset
212 ----------------------------------------------------------
8db56d2f8b72 planemo upload commit c79a5f4a05156bb2a6035a844aa9ad8f0e59ecb5
iuc
parents:
diff changeset
213
8db56d2f8b72 planemo upload commit c79a5f4a05156bb2a6035a844aa9ad8f0e59ecb5
iuc
parents:
diff changeset
214 Purpose
8db56d2f8b72 planemo upload commit c79a5f4a05156bb2a6035a844aa9ad8f0e59ecb5
iuc
parents:
diff changeset
215 -------
8db56d2f8b72 planemo upload commit c79a5f4a05156bb2a6035a844aa9ad8f0e59ecb5
iuc
parents:
diff changeset
216
8db56d2f8b72 planemo upload commit c79a5f4a05156bb2a6035a844aa9ad8f0e59ecb5
iuc
parents:
diff changeset
217 The purpose of this command is to count the number of reads per gene based
8db56d2f8b72 planemo upload commit c79a5f4a05156bb2a6035a844aa9ad8f0e59ecb5
iuc
parents:
diff changeset
218 on the mapping co-ordinate and the UMI attached to the read.
8db56d2f8b72 planemo upload commit c79a5f4a05156bb2a6035a844aa9ad8f0e59ecb5
iuc
parents:
diff changeset
219
8db56d2f8b72 planemo upload commit c79a5f4a05156bb2a6035a844aa9ad8f0e59ecb5
iuc
parents:
diff changeset
220
8db56d2f8b72 planemo upload commit c79a5f4a05156bb2a6035a844aa9ad8f0e59ecb5
iuc
parents:
diff changeset
221 It is assumed that the FASTQ files were processed with extract_umi.py
8db56d2f8b72 planemo upload commit c79a5f4a05156bb2a6035a844aa9ad8f0e59ecb5
iuc
parents:
diff changeset
222 before mapping and thus the UMI is the last word of the read name, e.g.:
8db56d2f8b72 planemo upload commit c79a5f4a05156bb2a6035a844aa9ad8f0e59ecb5
iuc
parents:
diff changeset
223
8db56d2f8b72 planemo upload commit c79a5f4a05156bb2a6035a844aa9ad8f0e59ecb5
iuc
parents:
diff changeset
224 @HISEQ:87:00000000_AATT
8db56d2f8b72 planemo upload commit c79a5f4a05156bb2a6035a844aa9ad8f0e59ecb5
iuc
parents:
diff changeset
225
8db56d2f8b72 planemo upload commit c79a5f4a05156bb2a6035a844aa9ad8f0e59ecb5
iuc
parents:
diff changeset
226 where AATT is the UMI sequence.
8db56d2f8b72 planemo upload commit c79a5f4a05156bb2a6035a844aa9ad8f0e59ecb5
iuc
parents:
diff changeset
227
8db56d2f8b72 planemo upload commit c79a5f4a05156bb2a6035a844aa9ad8f0e59ecb5
iuc
parents:
diff changeset
228 If you have used an alternative method which does not separate the
8db56d2f8b72 planemo upload commit c79a5f4a05156bb2a6035a844aa9ad8f0e59ecb5
iuc
parents:
diff changeset
229 read id and UMI with a "_", such as bcl2fastq which uses ":", you can
8db56d2f8b72 planemo upload commit c79a5f4a05156bb2a6035a844aa9ad8f0e59ecb5
iuc
parents:
diff changeset
230 specify the separator, or if your UMIs are encoded in a tag you can also specify this.
8db56d2f8b72 planemo upload commit c79a5f4a05156bb2a6035a844aa9ad8f0e59ecb5
iuc
parents:
diff changeset
231
8db56d2f8b72 planemo upload commit c79a5f4a05156bb2a6035a844aa9ad8f0e59ecb5
iuc
parents:
diff changeset
232 ]]></help>
8db56d2f8b72 planemo upload commit c79a5f4a05156bb2a6035a844aa9ad8f0e59ecb5
iuc
parents:
diff changeset
233 <expand macro="citations" />
8db56d2f8b72 planemo upload commit c79a5f4a05156bb2a6035a844aa9ad8f0e59ecb5
iuc
parents:
diff changeset
234 </tool>