0
|
1 <tool id="phastOdds_for_intervals" name="Compute phastOdds score" version="1.0.0">
|
|
2 <description>for each interval</description>
|
|
3 <command interpreter="python">get_scores_galaxy.py $per_col ${score_file}.h5 ${score_file}.mapping.bed $input $output ${input.metadata.chromCol} ${input.metadata.startCol} ${input.metadata.endCol}</command>
|
|
4 <inputs>
|
|
5 <param format="interval" name="input" type="data" label="Interval file">
|
|
6 <validator type="unspecified_build" message="Unspecified build, this tool works with data from genome builds hg17. Click the pencil icon in your history item to set the genome build."/>
|
|
7 <validator type="dataset_metadata_in_file" filename="phastOdds.loc" metadata_name="dbkey" metadata_column="0" message="Sequences are currently unavailable for the specified build." />
|
|
8 </param>
|
|
9 <param name="score_file" type="select" label="Available datasets">
|
|
10 <options from_file="phastOdds.loc">
|
|
11 <column name="name" index="1"/>
|
|
12 <column name="value" index="2"/>
|
|
13 <column name="dbkey" index="0"/>
|
|
14 <filter type="data_meta" ref="input" key="dbkey" column="0" />
|
|
15 </options>
|
|
16 </param>
|
|
17 <param name="per_col" type="boolean" label="Standardize" help="Standardizes the score to be per alignment column" checked="yes" truevalue="-p" falsevalue=""/>
|
|
18 </inputs>
|
|
19 <outputs>
|
|
20 <data format="interval" name="output" metadata_source="input"/>
|
|
21 </outputs>
|
|
22 <requirements>
|
|
23 <requirement type="python-module">numpy</requirement>
|
|
24 <requirement type="python-module">tables</requirement>
|
|
25 </requirements>
|
|
26 <tests>
|
|
27 <test>
|
|
28 <param name="input" value="4.bed" dbkey="hg17" ftype="bed"/>
|
|
29 <param name="score_file" value="/galaxy/data/phastOdds_precomputed/encode_SEP-2005_tba.v2_phastOdds" />
|
|
30 <param name="per_col" value="true" />
|
|
31 <output name="output" file="phastOdds_tool_out.interval" />
|
|
32 </test>
|
|
33 </tests>
|
|
34 <help>
|
|
35
|
|
36 .. class:: warningmark
|
|
37
|
|
38 This tool currently only works with interval data from genome build hg17.
|
|
39
|
|
40 .. class:: warningmark
|
|
41
|
|
42 This tool assumes that the input dataset is in interval format and contains at least a chrom column, a start column and an end column. These 3 columns can be dispersed throughout any number of other data columns.
|
|
43
|
|
44 -----
|
|
45
|
|
46 **Syntax**
|
|
47
|
|
48 Append a column to each line of an interval file containing the phastOdds score for that interval.
|
|
49
|
|
50 -----
|
|
51
|
|
52 **Example**
|
|
53
|
|
54 If your original data has the following format:
|
|
55
|
|
56 +-----+-----+---+
|
|
57 |chrom|start|end|
|
|
58 +-----+-----+---+
|
|
59
|
|
60 and you choose to compute phastOdds scores, your output will look like this:
|
|
61
|
|
62 +-----+-----+---+-----+
|
|
63 |chrom|start|end|score|
|
|
64 +-----+-----+---+-----+
|
|
65
|
|
66 </help>
|
|
67 </tool>
|