annotate SMART/galaxy/Clusterize.xml @ 58:5f5c9b74c2dd

Uploaded
author m-zytnicki
date Fri, 07 Feb 2014 11:53:36 -0500
parents 97aa2e42bfdf
children 90f4b29d884f
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
38
2c0c0a89fad7 Uploaded
m-zytnicki
parents:
diff changeset
1 <tool id="MergingDataClusterize" name="clusterize">
2c0c0a89fad7 Uploaded
m-zytnicki
parents:
diff changeset
2 <description>Clusterize features when their genomic intervals overlap.</description>
2c0c0a89fad7 Uploaded
m-zytnicki
parents:
diff changeset
3 <requirements>
2c0c0a89fad7 Uploaded
m-zytnicki
parents:
diff changeset
4 <requirement type="set_environment">PYTHONPATH</requirement>
2c0c0a89fad7 Uploaded
m-zytnicki
parents:
diff changeset
5 </requirements>
2c0c0a89fad7 Uploaded
m-zytnicki
parents:
diff changeset
6 <command interpreter="python">
2c0c0a89fad7 Uploaded
m-zytnicki
parents:
diff changeset
7 ../Java/Python/clusterize.py -i $formatType.inputFileName
2c0c0a89fad7 Uploaded
m-zytnicki
parents:
diff changeset
8 #if $formatType.FormatInputFileName == 'bed':
2c0c0a89fad7 Uploaded
m-zytnicki
parents:
diff changeset
9 -f bed
2c0c0a89fad7 Uploaded
m-zytnicki
parents:
diff changeset
10 #elif $formatType.FormatInputFileName == 'gff':
2c0c0a89fad7 Uploaded
m-zytnicki
parents:
diff changeset
11 -f gff
2c0c0a89fad7 Uploaded
m-zytnicki
parents:
diff changeset
12 #elif $formatType.FormatInputFileName == 'gff2':
2c0c0a89fad7 Uploaded
m-zytnicki
parents:
diff changeset
13 -f gff2
2c0c0a89fad7 Uploaded
m-zytnicki
parents:
diff changeset
14 #elif $formatType.FormatInputFileName == 'gff3':
2c0c0a89fad7 Uploaded
m-zytnicki
parents:
diff changeset
15 -f gff3
2c0c0a89fad7 Uploaded
m-zytnicki
parents:
diff changeset
16 #elif $formatType.FormatInputFileName == 'sam':
2c0c0a89fad7 Uploaded
m-zytnicki
parents:
diff changeset
17 -f sam
56
97aa2e42bfdf Uploaded
m-zytnicki
parents: 38
diff changeset
18 #elif $formatType.FormatInputFileName == 'bam':
97aa2e42bfdf Uploaded
m-zytnicki
parents: 38
diff changeset
19 -f bam
38
2c0c0a89fad7 Uploaded
m-zytnicki
parents:
diff changeset
20 #elif $formatType.FormatInputFileName == 'gtf':
2c0c0a89fad7 Uploaded
m-zytnicki
parents:
diff changeset
21 -f gtf
2c0c0a89fad7 Uploaded
m-zytnicki
parents:
diff changeset
22 #end if
2c0c0a89fad7 Uploaded
m-zytnicki
parents:
diff changeset
23 -o $outputFileGff
2c0c0a89fad7 Uploaded
m-zytnicki
parents:
diff changeset
24 $colinear
2c0c0a89fad7 Uploaded
m-zytnicki
parents:
diff changeset
25 $normalize
2c0c0a89fad7 Uploaded
m-zytnicki
parents:
diff changeset
26 -d $distance
2c0c0a89fad7 Uploaded
m-zytnicki
parents:
diff changeset
27 </command>
2c0c0a89fad7 Uploaded
m-zytnicki
parents:
diff changeset
28
2c0c0a89fad7 Uploaded
m-zytnicki
parents:
diff changeset
29 <inputs>
2c0c0a89fad7 Uploaded
m-zytnicki
parents:
diff changeset
30 <conditional name="formatType">
2c0c0a89fad7 Uploaded
m-zytnicki
parents:
diff changeset
31 <param name="FormatInputFileName" type="select" label="Input File Format">
2c0c0a89fad7 Uploaded
m-zytnicki
parents:
diff changeset
32 <option value="bed">bed</option>
2c0c0a89fad7 Uploaded
m-zytnicki
parents:
diff changeset
33 <option value="gff">gff</option>
2c0c0a89fad7 Uploaded
m-zytnicki
parents:
diff changeset
34 <option value="gff2">gff2</option>
2c0c0a89fad7 Uploaded
m-zytnicki
parents:
diff changeset
35 <option value="gff3">gff3</option>
2c0c0a89fad7 Uploaded
m-zytnicki
parents:
diff changeset
36 <option value="sam">sam</option>
56
97aa2e42bfdf Uploaded
m-zytnicki
parents: 38
diff changeset
37 <option value="bam">bam</option>
38
2c0c0a89fad7 Uploaded
m-zytnicki
parents:
diff changeset
38 <option value="gtf">gtf</option>
2c0c0a89fad7 Uploaded
m-zytnicki
parents:
diff changeset
39 </param>
2c0c0a89fad7 Uploaded
m-zytnicki
parents:
diff changeset
40 <when value="bed">
2c0c0a89fad7 Uploaded
m-zytnicki
parents:
diff changeset
41 <param name="inputFileName" format="bed" type="data" label="Input File"/>
2c0c0a89fad7 Uploaded
m-zytnicki
parents:
diff changeset
42 </when>
2c0c0a89fad7 Uploaded
m-zytnicki
parents:
diff changeset
43 <when value="gff">
2c0c0a89fad7 Uploaded
m-zytnicki
parents:
diff changeset
44 <param name="inputFileName" format="gff" type="data" label="Input File"/>
2c0c0a89fad7 Uploaded
m-zytnicki
parents:
diff changeset
45 </when>
2c0c0a89fad7 Uploaded
m-zytnicki
parents:
diff changeset
46 <when value="gff2">
2c0c0a89fad7 Uploaded
m-zytnicki
parents:
diff changeset
47 <param name="inputFileName" format="gff2" type="data" label="Input File"/>
2c0c0a89fad7 Uploaded
m-zytnicki
parents:
diff changeset
48 </when>
2c0c0a89fad7 Uploaded
m-zytnicki
parents:
diff changeset
49 <when value="gff3">
2c0c0a89fad7 Uploaded
m-zytnicki
parents:
diff changeset
50 <param name="inputFileName" format="gff3" type="data" label="Input File"/>
2c0c0a89fad7 Uploaded
m-zytnicki
parents:
diff changeset
51 </when>
2c0c0a89fad7 Uploaded
m-zytnicki
parents:
diff changeset
52 <when value="sam">
2c0c0a89fad7 Uploaded
m-zytnicki
parents:
diff changeset
53 <param name="inputFileName" format="sam" type="data" label="Input File"/>
2c0c0a89fad7 Uploaded
m-zytnicki
parents:
diff changeset
54 </when>
56
97aa2e42bfdf Uploaded
m-zytnicki
parents: 38
diff changeset
55 <when value="bam">
97aa2e42bfdf Uploaded
m-zytnicki
parents: 38
diff changeset
56 <param name="inputFileName" format="bam" type="data" label="Input File"/>
97aa2e42bfdf Uploaded
m-zytnicki
parents: 38
diff changeset
57 </when>
38
2c0c0a89fad7 Uploaded
m-zytnicki
parents:
diff changeset
58 <when value="gtf">
2c0c0a89fad7 Uploaded
m-zytnicki
parents:
diff changeset
59 <param name="inputFileName" format="gtf" type="data" label="Input File"/>
2c0c0a89fad7 Uploaded
m-zytnicki
parents:
diff changeset
60 </when>
2c0c0a89fad7 Uploaded
m-zytnicki
parents:
diff changeset
61 </conditional>
2c0c0a89fad7 Uploaded
m-zytnicki
parents:
diff changeset
62
2c0c0a89fad7 Uploaded
m-zytnicki
parents:
diff changeset
63 <param name="colinear" type="boolean" truevalue="-c" falsevalue="" checked="false" label="Only merge collinear features"/>
2c0c0a89fad7 Uploaded
m-zytnicki
parents:
diff changeset
64 <param name="normalize" type="boolean" truevalue="-n" falsevalue="" checked="false" label="Normalize counts" help="Only works if the nbOccurrences tag is set."/>
2c0c0a89fad7 Uploaded
m-zytnicki
parents:
diff changeset
65 <!-- distance is passed to clusterize.py as "-d $distance"; declaring it as an integer lets Galaxy reject non-numeric input in the form instead of failing at run time --> <param name="distance" type="integer" value="0" label="merge features if their relative distance is within N nt"/>
2c0c0a89fad7 Uploaded
m-zytnicki
parents:
diff changeset
66 </inputs>
2c0c0a89fad7 Uploaded
m-zytnicki
parents:
diff changeset
67
2c0c0a89fad7 Uploaded
m-zytnicki
parents:
diff changeset
68 <outputs>
2c0c0a89fad7 Uploaded
m-zytnicki
parents:
diff changeset
69 <data name="outputFileGff" format="gff3"/>
2c0c0a89fad7 Uploaded
m-zytnicki
parents:
diff changeset
70 </outputs>
2c0c0a89fad7 Uploaded
m-zytnicki
parents:
diff changeset
71
2c0c0a89fad7 Uploaded
m-zytnicki
parents:
diff changeset
72 <help>
2c0c0a89fad7 Uploaded
m-zytnicki
parents:
diff changeset
73 The script clusterizes the input genomic data. Two features are clusterized when their genomic intervals overlap. The output is a GFF3 file, where each element is a cluster. The number of elements in the cluster is given by the tag **nbElements**. The name of a cluster is the concatenation of the names of its reads (like **read1--read2--read3**). Note that if the length of the name of the cluster exceeds 100 characters, it is truncated to the first 100 characters.
2c0c0a89fad7 Uploaded
m-zytnicki
parents:
diff changeset
74
2c0c0a89fad7 Uploaded
m-zytnicki
parents:
diff changeset
75 Optionally, features that do not overlap but lie within a given distance of each other can also be clusterized.
2c0c0a89fad7 Uploaded
m-zytnicki
parents:
diff changeset
76
2c0c0a89fad7 Uploaded
m-zytnicki
parents:
diff changeset
77 By default, the tool clusterizes all features which overlap (or nearly overlap), even if they are on different strands. If you want to clusterize the features which are on the same strand only, you can specify it.
2c0c0a89fad7 Uploaded
m-zytnicki
parents:
diff changeset
78 </help>
2c0c0a89fad7 Uploaded
m-zytnicki
parents:
diff changeset
79 </tool>