annotate SMART/galaxy/Clusterize.xml @ 63:5f210bc9f486

Added a simple test for Clusterize
author m-zytnicki
date Mon, 19 Oct 2015 12:02:29 +0200
parents 90f4b29d884f
children
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
38
2c0c0a89fad7 Uploaded
m-zytnicki
parents:
diff changeset
1 <tool id="MergingDataClusterize" name="clusterize">
2c0c0a89fad7 Uploaded
m-zytnicki
parents:
diff changeset
2 <description>Clusterize features when their genomic intervals overlap.</description>
2c0c0a89fad7 Uploaded
m-zytnicki
parents:
diff changeset
3 <requirements>
2c0c0a89fad7 Uploaded
m-zytnicki
parents:
diff changeset
4 <requirement type="set_environment">PYTHONPATH</requirement>
2c0c0a89fad7 Uploaded
m-zytnicki
parents:
diff changeset
5 </requirements>
2c0c0a89fad7 Uploaded
m-zytnicki
parents:
diff changeset
6 <command interpreter="python">
60
90f4b29d884f Uploaded
m-zytnicki
parents: 56
diff changeset
7 #set $inputFiles = ",".join(["%s" % (s) for s in $formatType.inputFileName])
90f4b29d884f Uploaded
m-zytnicki
parents: 56
diff changeset
8 ../Java/Python/clusterize.py -i $inputFiles -f $formatType.FormatInputFileName -o $outputFileGff $colinear $normalize -d $distance
38
2c0c0a89fad7 Uploaded
m-zytnicki
parents:
diff changeset
9 </command>
2c0c0a89fad7 Uploaded
m-zytnicki
parents:
diff changeset
10
2c0c0a89fad7 Uploaded
m-zytnicki
parents:
diff changeset
11 <inputs>
2c0c0a89fad7 Uploaded
m-zytnicki
parents:
diff changeset
12 <conditional name="formatType">
2c0c0a89fad7 Uploaded
m-zytnicki
parents:
diff changeset
13 <param name="FormatInputFileName" type="select" label="Input File Format">
2c0c0a89fad7 Uploaded
m-zytnicki
parents:
diff changeset
14 <option value="bed">bed</option>
2c0c0a89fad7 Uploaded
m-zytnicki
parents:
diff changeset
15 <option value="gff">gff</option>
2c0c0a89fad7 Uploaded
m-zytnicki
parents:
diff changeset
16 <option value="gff2">gff2</option>
2c0c0a89fad7 Uploaded
m-zytnicki
parents:
diff changeset
17 <option value="gff3">gff3</option>
2c0c0a89fad7 Uploaded
m-zytnicki
parents:
diff changeset
18 <option value="sam">sam</option>
60
90f4b29d884f Uploaded
m-zytnicki
parents: 56
diff changeset
19 <option value="gtf">gtf</option>
56
97aa2e42bfdf Uploaded
m-zytnicki
parents: 38
diff changeset
20 <option value="bam">bam</option>
38
2c0c0a89fad7 Uploaded
m-zytnicki
parents:
diff changeset
21 </param>
2c0c0a89fad7 Uploaded
m-zytnicki
parents:
diff changeset
22 <when value="bed">
60
90f4b29d884f Uploaded
m-zytnicki
parents: 56
diff changeset
23 <param name="inputFileName" format="bed" type="data" multiple="true" label="Input File"/>
38
2c0c0a89fad7 Uploaded
m-zytnicki
parents:
diff changeset
24 </when>
2c0c0a89fad7 Uploaded
m-zytnicki
parents:
diff changeset
25 <when value="gff">
60
90f4b29d884f Uploaded
m-zytnicki
parents: 56
diff changeset
26 <param name="inputFileName" format="gff" type="data" multiple="true" label="Input File"/>
38
2c0c0a89fad7 Uploaded
m-zytnicki
parents:
diff changeset
27 </when>
2c0c0a89fad7 Uploaded
m-zytnicki
parents:
diff changeset
28 <when value="gff2">
60
90f4b29d884f Uploaded
m-zytnicki
parents: 56
diff changeset
29 <param name="inputFileName" format="gff2" type="data" multiple="true" label="Input File"/>
38
2c0c0a89fad7 Uploaded
m-zytnicki
parents:
diff changeset
30 </when>
2c0c0a89fad7 Uploaded
m-zytnicki
parents:
diff changeset
31 <when value="gff3">
60
90f4b29d884f Uploaded
m-zytnicki
parents: 56
diff changeset
32 <param name="inputFileName" format="gff3" type="data" multiple="true" label="Input File"/>
38
2c0c0a89fad7 Uploaded
m-zytnicki
parents:
diff changeset
33 </when>
2c0c0a89fad7 Uploaded
m-zytnicki
parents:
diff changeset
34 <when value="sam">
60
90f4b29d884f Uploaded
m-zytnicki
parents: 56
diff changeset
35 <param name="inputFileName" format="sam" type="data" multiple="true" label="Input File"/>
90f4b29d884f Uploaded
m-zytnicki
parents: 56
diff changeset
36 </when>
90f4b29d884f Uploaded
m-zytnicki
parents: 56
diff changeset
37 <when value="gtf">
90f4b29d884f Uploaded
m-zytnicki
parents: 56
diff changeset
38 <param name="inputFileName" format="gtf" type="data" multiple="true" label="Input File"/>
38
2c0c0a89fad7 Uploaded
m-zytnicki
parents:
diff changeset
39 </when>
56
97aa2e42bfdf Uploaded
m-zytnicki
parents: 38
diff changeset
40 <when value="bam">
60
90f4b29d884f Uploaded
m-zytnicki
parents: 56
diff changeset
41 <param name="inputFileName" format="bam" type="data" multiple="true" label="Input File"/>
38
2c0c0a89fad7 Uploaded
m-zytnicki
parents:
diff changeset
42 </when>
2c0c0a89fad7 Uploaded
m-zytnicki
parents:
diff changeset
43 </conditional>
2c0c0a89fad7 Uploaded
m-zytnicki
parents:
diff changeset
44
2c0c0a89fad7 Uploaded
m-zytnicki
parents:
diff changeset
45 <param name="colinear" type="boolean" truevalue="-c" falsevalue="" checked="false" label="Only merge collinear features"/>
2c0c0a89fad7 Uploaded
m-zytnicki
parents:
diff changeset
46 <param name="normalize" type="boolean" truevalue="-n" falsevalue="" checked="false" label="Normalize counts" help="Only works if the nbOccurrences tag is set."/>
2c0c0a89fad7 Uploaded
m-zytnicki
parents:
diff changeset
47 <param name="distance" type="text" value="0" label="merge features if their relative distance is within N nt"/>
2c0c0a89fad7 Uploaded
m-zytnicki
parents:
diff changeset
48 </inputs>
2c0c0a89fad7 Uploaded
m-zytnicki
parents:
diff changeset
49
2c0c0a89fad7 Uploaded
m-zytnicki
parents:
diff changeset
50 <outputs>
2c0c0a89fad7 Uploaded
m-zytnicki
parents:
diff changeset
51 <data name="outputFileGff" format="gff3"/>
2c0c0a89fad7 Uploaded
m-zytnicki
parents:
diff changeset
52 </outputs>
2c0c0a89fad7 Uploaded
m-zytnicki
parents:
diff changeset
53
63
5f210bc9f486 Added a simple test for Clusterize
m-zytnicki
parents: 60
diff changeset
54 <tests>
5f210bc9f486 Added a simple test for Clusterize
m-zytnicki
parents: 60
diff changeset
55 <test>
5f210bc9f486 Added a simple test for Clusterize
m-zytnicki
parents: 60
diff changeset
56 <!-- basic test -->
5f210bc9f486 Added a simple test for Clusterize
m-zytnicki
parents: 60
diff changeset
57 <param name="FormatInputFileName" value="bed"/>
5f210bc9f486 Added a simple test for Clusterize
m-zytnicki
parents: 60
diff changeset
58 <param name="inputFileName" value="smart_1.bed" ftype="bed"/>
5f210bc9f486 Added a simple test for Clusterize
m-zytnicki
parents: 60
diff changeset
59 <param name="colinear" value="false"/>
5f210bc9f486 Added a simple test for Clusterize
m-zytnicki
parents: 60
diff changeset
60 <param name="normalize" value="false"/>
5f210bc9f486 Added a simple test for Clusterize
m-zytnicki
parents: 60
diff changeset
61 <param name="distance" value="0"/>
5f210bc9f486 Added a simple test for Clusterize
m-zytnicki
parents: 60
diff changeset
62 <output name="outputFileGff" file="smart_clusterize_out_1.gff3" ftype="gff3"/> <!-- name must match the data element declared in outputs (outputFileGff) so the expected file is compared against the tool's real output -->
5f210bc9f486 Added a simple test for Clusterize
m-zytnicki
parents: 60
diff changeset
63 </test>
5f210bc9f486 Added a simple test for Clusterize
m-zytnicki
parents: 60
diff changeset
64 </tests>
5f210bc9f486 Added a simple test for Clusterize
m-zytnicki
parents: 60
diff changeset
65
38
2c0c0a89fad7 Uploaded
m-zytnicki
parents:
diff changeset
66 <help>
2c0c0a89fad7 Uploaded
m-zytnicki
parents:
diff changeset
67 The script clusterizes the input genomic data. Two features are clusterized when their genomic intervals overlap. The output is a GFF3 file, where each element is a cluster. The number of elements in the cluster is given by the tag **nbElements**. The name of a cluster is the concatenation of the names of its reads (like **read1--read2--read3**). Note that if the size of the name of the cluster exceeds 100 characters, it is truncated to the first 100 characters.
2c0c0a89fad7 Uploaded
m-zytnicki
parents:
diff changeset
68
2c0c0a89fad7 Uploaded
m-zytnicki
parents:
diff changeset
69 Some options may clusterize the features which are closer than a given distance.
2c0c0a89fad7 Uploaded
m-zytnicki
parents:
diff changeset
70
2c0c0a89fad7 Uploaded
m-zytnicki
parents:
diff changeset
71 By default, the tool clusterizes all features which overlap (or nearly overlap), even if they are on different strands. If you want to clusterize the features which are on the same strand only, you can specify it.
2c0c0a89fad7 Uploaded
m-zytnicki
parents:
diff changeset
72 </help>
2c0c0a89fad7 Uploaded
m-zytnicki
parents:
diff changeset
73 </tool>