annotate SMART/galaxy/Clusterize.xml @ 46:169d364ddd91

Uploaded
author m-zytnicki
date Mon, 30 Sep 2013 03:19:26 -0400
parents 2c0c0a89fad7
children 97aa2e42bfdf
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
38
2c0c0a89fad7 Uploaded
m-zytnicki
parents:
diff changeset
1 <tool id="MergingDataClusterize" name="clusterize">
2c0c0a89fad7 Uploaded
m-zytnicki
parents:
diff changeset
2 <description>Clusterize features when their genomic intervals overlap.</description>
2c0c0a89fad7 Uploaded
m-zytnicki
parents:
diff changeset
3 <requirements>
2c0c0a89fad7 Uploaded
m-zytnicki
parents:
diff changeset
4 <requirement type="set_environment">PYTHONPATH</requirement>
2c0c0a89fad7 Uploaded
m-zytnicki
parents:
diff changeset
5 </requirements>
2c0c0a89fad7 Uploaded
m-zytnicki
parents:
diff changeset
6 <command interpreter="python">
2c0c0a89fad7 Uploaded
m-zytnicki
parents:
diff changeset
7 ../Java/Python/clusterize.py -i $formatType.inputFileName
2c0c0a89fad7 Uploaded
m-zytnicki
parents:
diff changeset
8 #if $formatType.FormatInputFileName == 'bed':
2c0c0a89fad7 Uploaded
m-zytnicki
parents:
diff changeset
9 -f bed
2c0c0a89fad7 Uploaded
m-zytnicki
parents:
diff changeset
10 #elif $formatType.FormatInputFileName == 'gff':
2c0c0a89fad7 Uploaded
m-zytnicki
parents:
diff changeset
11 -f gff
2c0c0a89fad7 Uploaded
m-zytnicki
parents:
diff changeset
12 #elif $formatType.FormatInputFileName == 'gff2':
2c0c0a89fad7 Uploaded
m-zytnicki
parents:
diff changeset
13 -f gff2
2c0c0a89fad7 Uploaded
m-zytnicki
parents:
diff changeset
14 #elif $formatType.FormatInputFileName == 'gff3':
2c0c0a89fad7 Uploaded
m-zytnicki
parents:
diff changeset
15 -f gff3
2c0c0a89fad7 Uploaded
m-zytnicki
parents:
diff changeset
16 #elif $formatType.FormatInputFileName == 'sam':
2c0c0a89fad7 Uploaded
m-zytnicki
parents:
diff changeset
17 -f sam
2c0c0a89fad7 Uploaded
m-zytnicki
parents:
diff changeset
18 #elif $formatType.FormatInputFileName == 'gtf':
2c0c0a89fad7 Uploaded
m-zytnicki
parents:
diff changeset
19 -f gtf
2c0c0a89fad7 Uploaded
m-zytnicki
parents:
diff changeset
20 #end if
2c0c0a89fad7 Uploaded
m-zytnicki
parents:
diff changeset
21 -o $outputFileGff
2c0c0a89fad7 Uploaded
m-zytnicki
parents:
diff changeset
22 $colinear
2c0c0a89fad7 Uploaded
m-zytnicki
parents:
diff changeset
23 $normalize
2c0c0a89fad7 Uploaded
m-zytnicki
parents:
diff changeset
24 -d $distance
2c0c0a89fad7 Uploaded
m-zytnicki
parents:
diff changeset
25 </command>
2c0c0a89fad7 Uploaded
m-zytnicki
parents:
diff changeset
26
2c0c0a89fad7 Uploaded
m-zytnicki
parents:
diff changeset
27 <inputs>
2c0c0a89fad7 Uploaded
m-zytnicki
parents:
diff changeset
28 <conditional name="formatType">
2c0c0a89fad7 Uploaded
m-zytnicki
parents:
diff changeset
29 <param name="FormatInputFileName" type="select" label="Input File Format">
2c0c0a89fad7 Uploaded
m-zytnicki
parents:
diff changeset
30 <option value="bed">bed</option>
2c0c0a89fad7 Uploaded
m-zytnicki
parents:
diff changeset
31 <option value="gff">gff</option>
2c0c0a89fad7 Uploaded
m-zytnicki
parents:
diff changeset
32 <option value="gff2">gff2</option>
2c0c0a89fad7 Uploaded
m-zytnicki
parents:
diff changeset
33 <option value="gff3">gff3</option>
2c0c0a89fad7 Uploaded
m-zytnicki
parents:
diff changeset
34 <option value="sam">sam</option>
2c0c0a89fad7 Uploaded
m-zytnicki
parents:
diff changeset
35 <option value="gtf">gtf</option>
2c0c0a89fad7 Uploaded
m-zytnicki
parents:
diff changeset
36 </param>
2c0c0a89fad7 Uploaded
m-zytnicki
parents:
diff changeset
37 <when value="bed">
2c0c0a89fad7 Uploaded
m-zytnicki
parents:
diff changeset
38 <param name="inputFileName" format="bed" type="data" label="Input File"/>
2c0c0a89fad7 Uploaded
m-zytnicki
parents:
diff changeset
39 </when>
2c0c0a89fad7 Uploaded
m-zytnicki
parents:
diff changeset
40 <when value="gff">
2c0c0a89fad7 Uploaded
m-zytnicki
parents:
diff changeset
41 <param name="inputFileName" format="gff" type="data" label="Input File"/>
2c0c0a89fad7 Uploaded
m-zytnicki
parents:
diff changeset
42 </when>
2c0c0a89fad7 Uploaded
m-zytnicki
parents:
diff changeset
43 <when value="gff2">
2c0c0a89fad7 Uploaded
m-zytnicki
parents:
diff changeset
44 <param name="inputFileName" format="gff2" type="data" label="Input File"/>
2c0c0a89fad7 Uploaded
m-zytnicki
parents:
diff changeset
45 </when>
2c0c0a89fad7 Uploaded
m-zytnicki
parents:
diff changeset
46 <when value="gff3">
2c0c0a89fad7 Uploaded
m-zytnicki
parents:
diff changeset
47 <param name="inputFileName" format="gff3" type="data" label="Input File"/>
2c0c0a89fad7 Uploaded
m-zytnicki
parents:
diff changeset
48 </when>
2c0c0a89fad7 Uploaded
m-zytnicki
parents:
diff changeset
49 <when value="sam">
2c0c0a89fad7 Uploaded
m-zytnicki
parents:
diff changeset
50 <param name="inputFileName" format="sam" type="data" label="Input File"/>
2c0c0a89fad7 Uploaded
m-zytnicki
parents:
diff changeset
51 </when>
2c0c0a89fad7 Uploaded
m-zytnicki
parents:
diff changeset
52 <when value="gtf">
2c0c0a89fad7 Uploaded
m-zytnicki
parents:
diff changeset
53 <param name="inputFileName" format="gtf" type="data" label="Input File"/>
2c0c0a89fad7 Uploaded
m-zytnicki
parents:
diff changeset
54 </when>
2c0c0a89fad7 Uploaded
m-zytnicki
parents:
diff changeset
55 </conditional>
2c0c0a89fad7 Uploaded
m-zytnicki
parents:
diff changeset
56
2c0c0a89fad7 Uploaded
m-zytnicki
parents:
diff changeset
57 <param name="colinear" type="boolean" truevalue="-c" falsevalue="" checked="false" label="Only merge collinear features"/>
2c0c0a89fad7 Uploaded
m-zytnicki
parents:
diff changeset
58 <param name="normalize" type="boolean" truevalue="-n" falsevalue="" checked="false" label="Normalize counts" help="Only works if the nbOccurrences tag is set."/>
2c0c0a89fad7 Uploaded
m-zytnicki
parents:
diff changeset
59 <param name="distance" type="text" value="0" label="merge features if their relative distance is within N nt"/>
2c0c0a89fad7 Uploaded
m-zytnicki
parents:
diff changeset
60 </inputs>
2c0c0a89fad7 Uploaded
m-zytnicki
parents:
diff changeset
61
2c0c0a89fad7 Uploaded
m-zytnicki
parents:
diff changeset
62 <outputs>
2c0c0a89fad7 Uploaded
m-zytnicki
parents:
diff changeset
63 <data name="outputFileGff" format="gff3"/>
2c0c0a89fad7 Uploaded
m-zytnicki
parents:
diff changeset
64 </outputs>
2c0c0a89fad7 Uploaded
m-zytnicki
parents:
diff changeset
65
2c0c0a89fad7 Uploaded
m-zytnicki
parents:
diff changeset
66 <help>
2c0c0a89fad7 Uploaded
m-zytnicki
parents:
diff changeset
67 The script clusterizes the input genomic data. Two features are clusterized when their genomic intervals overlap. The output is a GFF3 file, where each element is a cluster. The number of elements in the cluster is given by the tag **nbElements**. The name of a cluster is the concatenation of the names of its reads (like **read1--read2--read3**). Note that if the length of the cluster name exceeds 100 characters, it is truncated to the first 100 characters.
2c0c0a89fad7 Uploaded
m-zytnicki
parents:
diff changeset
68
2c0c0a89fad7 Uploaded
m-zytnicki
parents:
diff changeset
69 Features that do not overlap can also be clusterized: the distance option merges features whose relative distance is within a given number of nucleotides.
2c0c0a89fad7 Uploaded
m-zytnicki
parents:
diff changeset
70
2c0c0a89fad7 Uploaded
m-zytnicki
parents:
diff changeset
71 By default, the tool clusterizes all features which overlap (or nearly overlap), even if they are on different strands. If you want to clusterize only the features which are on the same strand, check the "Only merge collinear features" option.
2c0c0a89fad7 Uploaded
m-zytnicki
parents:
diff changeset
72 </help>
2c0c0a89fad7 Uploaded
m-zytnicki
parents:
diff changeset
73 </tool>