annotate SMART/galaxy/Clusterize.xml @ 36:44d5973c188c

Uploaded
author m-zytnicki
date Tue, 30 Apr 2013 15:02:29 -0400
parents
children
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
36
44d5973c188c Uploaded
m-zytnicki
parents:
diff changeset
1 <tool id="MergingDataClusterize" name="clusterize">
44d5973c188c Uploaded
m-zytnicki
parents:
diff changeset
2 <description>Clusterize features when their genomic intervals overlap.</description>
44d5973c188c Uploaded
m-zytnicki
parents:
diff changeset
3 <command interpreter="python">
44d5973c188c Uploaded
m-zytnicki
parents:
diff changeset
4 ../Java/Python/clusterize.py -i $formatType.inputFileName
44d5973c188c Uploaded
m-zytnicki
parents:
diff changeset
5 #if $formatType.FormatInputFileName == 'bed':
44d5973c188c Uploaded
m-zytnicki
parents:
diff changeset
6 -f bed
44d5973c188c Uploaded
m-zytnicki
parents:
diff changeset
7 #elif $formatType.FormatInputFileName == 'gff':
44d5973c188c Uploaded
m-zytnicki
parents:
diff changeset
8 -f gff
44d5973c188c Uploaded
m-zytnicki
parents:
diff changeset
9 #elif $formatType.FormatInputFileName == 'gff2':
44d5973c188c Uploaded
m-zytnicki
parents:
diff changeset
10 -f gff2
44d5973c188c Uploaded
m-zytnicki
parents:
diff changeset
11 #elif $formatType.FormatInputFileName == 'gff3':
44d5973c188c Uploaded
m-zytnicki
parents:
diff changeset
12 -f gff3
44d5973c188c Uploaded
m-zytnicki
parents:
diff changeset
13 #elif $formatType.FormatInputFileName == 'sam':
44d5973c188c Uploaded
m-zytnicki
parents:
diff changeset
14 -f sam
44d5973c188c Uploaded
m-zytnicki
parents:
diff changeset
15 #elif $formatType.FormatInputFileName == 'gtf':
44d5973c188c Uploaded
m-zytnicki
parents:
diff changeset
16 -f gtf
44d5973c188c Uploaded
m-zytnicki
parents:
diff changeset
17 #end if
44d5973c188c Uploaded
m-zytnicki
parents:
diff changeset
18 -o $outputFileGff
44d5973c188c Uploaded
m-zytnicki
parents:
diff changeset
19 $colinear
44d5973c188c Uploaded
m-zytnicki
parents:
diff changeset
20 $normalize
44d5973c188c Uploaded
m-zytnicki
parents:
diff changeset
21 -d $distance
44d5973c188c Uploaded
m-zytnicki
parents:
diff changeset
22 </command>
44d5973c188c Uploaded
m-zytnicki
parents:
diff changeset
23
44d5973c188c Uploaded
m-zytnicki
parents:
diff changeset
24 <inputs>
44d5973c188c Uploaded
m-zytnicki
parents:
diff changeset
25 <conditional name="formatType">
44d5973c188c Uploaded
m-zytnicki
parents:
diff changeset
26 <param name="FormatInputFileName" type="select" label="Input File Format">
44d5973c188c Uploaded
m-zytnicki
parents:
diff changeset
27 <option value="bed">bed</option>
44d5973c188c Uploaded
m-zytnicki
parents:
diff changeset
28 <option value="gff">gff</option>
44d5973c188c Uploaded
m-zytnicki
parents:
diff changeset
29 <option value="gff2">gff2</option>
44d5973c188c Uploaded
m-zytnicki
parents:
diff changeset
30 <option value="gff3">gff3</option>
44d5973c188c Uploaded
m-zytnicki
parents:
diff changeset
31 <option value="sam">sam</option>
44d5973c188c Uploaded
m-zytnicki
parents:
diff changeset
32 <option value="gtf">gtf</option>
44d5973c188c Uploaded
m-zytnicki
parents:
diff changeset
33 </param>
44d5973c188c Uploaded
m-zytnicki
parents:
diff changeset
34 <when value="bed">
44d5973c188c Uploaded
m-zytnicki
parents:
diff changeset
35 <param name="inputFileName" format="bed" type="data" label="Input File"/>
44d5973c188c Uploaded
m-zytnicki
parents:
diff changeset
36 </when>
44d5973c188c Uploaded
m-zytnicki
parents:
diff changeset
37 <when value="gff">
44d5973c188c Uploaded
m-zytnicki
parents:
diff changeset
38 <param name="inputFileName" format="gff" type="data" label="Input File"/>
44d5973c188c Uploaded
m-zytnicki
parents:
diff changeset
39 </when>
44d5973c188c Uploaded
m-zytnicki
parents:
diff changeset
40 <when value="gff2">
44d5973c188c Uploaded
m-zytnicki
parents:
diff changeset
41 <param name="inputFileName" format="gff2" type="data" label="Input File"/>
44d5973c188c Uploaded
m-zytnicki
parents:
diff changeset
42 </when>
44d5973c188c Uploaded
m-zytnicki
parents:
diff changeset
43 <when value="gff3">
44d5973c188c Uploaded
m-zytnicki
parents:
diff changeset
44 <param name="inputFileName" format="gff3" type="data" label="Input File"/>
44d5973c188c Uploaded
m-zytnicki
parents:
diff changeset
45 </when>
44d5973c188c Uploaded
m-zytnicki
parents:
diff changeset
46 <when value="sam">
44d5973c188c Uploaded
m-zytnicki
parents:
diff changeset
47 <param name="inputFileName" format="sam" type="data" label="Input File"/>
44d5973c188c Uploaded
m-zytnicki
parents:
diff changeset
48 </when>
44d5973c188c Uploaded
m-zytnicki
parents:
diff changeset
49 <when value="gtf">
44d5973c188c Uploaded
m-zytnicki
parents:
diff changeset
50 <param name="inputFileName" format="gtf" type="data" label="Input File"/>
44d5973c188c Uploaded
m-zytnicki
parents:
diff changeset
51 </when>
44d5973c188c Uploaded
m-zytnicki
parents:
diff changeset
52 </conditional>
44d5973c188c Uploaded
m-zytnicki
parents:
diff changeset
53
44d5973c188c Uploaded
m-zytnicki
parents:
diff changeset
54 <param name="colinear" type="boolean" truevalue="-c" falsevalue="" checked="false" label="Only merge collinear features"/>
44d5973c188c Uploaded
m-zytnicki
parents:
diff changeset
55 <param name="normalize" type="boolean" truevalue="-n" falsevalue="" checked="false" label="Normalize counts" help="Only works if the nbOccurrences tag is set."/>
44d5973c188c Uploaded
m-zytnicki
parents:
diff changeset
56 <param name="distance" type="text" value="0" label="merge features if their relative distance is within N nt"/>
44d5973c188c Uploaded
m-zytnicki
parents:
diff changeset
57 </inputs>
44d5973c188c Uploaded
m-zytnicki
parents:
diff changeset
58
44d5973c188c Uploaded
m-zytnicki
parents:
diff changeset
59 <outputs>
44d5973c188c Uploaded
m-zytnicki
parents:
diff changeset
60 <data name="outputFileGff" format="gff3"/>
44d5973c188c Uploaded
m-zytnicki
parents:
diff changeset
61 </outputs>
44d5973c188c Uploaded
m-zytnicki
parents:
diff changeset
62
44d5973c188c Uploaded
m-zytnicki
parents:
diff changeset
63 <help>
44d5973c188c Uploaded
m-zytnicki
parents:
diff changeset
64 The script clusterizes the input genomic data. Two features are clusterized when their genomic intervals overlap. The output is a GFF3 file, where each element is a cluster. The number of elements in the cluster is given by the tag **nbElements**. The name of a cluster is the concatenation of the names of its reads (like **read1--read2--read3**). Note that if the name of the cluster exceeds 100 characters, it is truncated to the first 100 characters.
44d5973c188c Uploaded
m-zytnicki
parents:
diff changeset
65
44d5973c188c Uploaded
m-zytnicki
parents:
diff changeset
66 Using the distance option, you can also clusterize features which do not overlap but are closer than a given distance (in nucleotides).
44d5973c188c Uploaded
m-zytnicki
parents:
diff changeset
67
44d5973c188c Uploaded
m-zytnicki
parents:
diff changeset
68 By default, the tool clusterizes all features which overlap (or nearly overlap), even if they are on different strands. If you want to clusterize the features which are on the same strand only, you can specify it.
44d5973c188c Uploaded
m-zytnicki
parents:
diff changeset
69 </help>
44d5973c188c Uploaded
m-zytnicki
parents:
diff changeset
70 </tool>