Mercurial > repos > iuc > deg_annotate
comparison deg_annotate.xml @ 0:b42373cddb77 draft
planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/deg_annotate commit bc766aeec78fe74a1d70d608d2f73ba3f2a3e047
author | iuc |
---|---|
date | Fri, 23 Nov 2018 01:59:47 -0500 |
parents | |
children | e98d4ab5b5bc |
comparison
equal
deleted
inserted
replaced
-1:000000000000 | 0:b42373cddb77 |
---|---|
1 <tool id="deg_annotate" name="Annotate DESeq2/DEXSeq output tables" version="1.0"> | |
2 <description>Append useful information from annotation files to DESeq2/DEXSeq outputs</description> | |
3 <requirements> | |
4 <requirement type="package" version="2.27.0">bedtools</requirement> | |
5 <requirement type="package" version="0.6.4">bcbiogff</requirement> | |
6 </requirements> | |
7 <command> | |
8 <![CDATA[ | |
9 python '$__tool_directory__/deg_annotate.py' -in '$input_table' | |
10 -m '$mode' | |
11 -g '$annotation' | |
12 -t '$advanced_parameters.gff_feature_type' | |
13 -i '$advanced_parameters.gff_feature_attribute' | |
14 -x '$advanced_parameters.gff_transcript_attribute' | |
15 -a '$advanced_parameters.gff_attributes' | |
16 -o '$output' | |
17 ]]> | |
18 </command> | |
19 <inputs> | |
20 <param name="input_table" | |
21 type="data" | |
22 format="tabular" | |
23 argument="-in" | |
24 label="Tabular output of DESeq2 or DEXSeq"/> | |
25 | |
26 <param name="mode" type="select" argument="-m" label="Input file type"> | |
27 <option value="deseq2">DESeq2</option> | |
28 <option value="dexseq">DEXseq</option> | |
29 </param> | |
30 | |
31 <param name="annotation" | |
32 type="data" | |
33 format="gff,gtf,gff3" | |
34 argument="-g" | |
35 label="Reference annotation in GFF/GTF format" /> | |
36 | |
37 <section name="advanced_parameters" title="Advanced options"> | |
38 <param name="gff_feature_type" | |
39 type="text" | |
40 value="exon" | |
41 argument="-t" | |
42 label="GFF feature type" | |
43 help="This is the 3rd column in GFF file. Only rows which have the matched feature type in the GTF annotation file will be included. `exon' by default." /> | |
44 | |
45 <param name="gff_feature_attribute" | |
46 type="text" | |
47 value="gene_id" | |
48 argument="-i" | |
49 label="GFF feature identifier" | |
50 help="GFF attribute to be used as feature identifier. The value of this attribute should match the first column of DESeq2 output (default: gene_id)" /> | |
51 | |
52 <param name="gff_transcript_attribute" | |
53 type="text" | |
54 value="transcript_id" | |
55 argument="-x" | |
56 label="GFF transcript identifier" | |
57 help="GFF attribute to be used as transcript identifier. This options is only used for DEXSeq output annotation. Exon numbers are counted for each transcript separately (default: transcript_id)" /> | |
58 | |
59 <param name="gff_attributes" | |
60 type="text" | |
61 value="gene_biotype, gene_name" | |
62 argument="-a" | |
63 label="GFF attributes to include" | |
64 help="Comma separated list of attributes from GFF file to include in output. These attributes should associate with your chosen GFF feature type." /> | |
65 </section> | |
66 </inputs> | |
67 <outputs> | |
68 <data name="output" format="tabular" label="${tool.name} on ${on_string}"/> | |
69 </outputs> | |
70 <tests> | |
71 <test expect_num_outputs="1"> | |
72 <param name="input_table" | |
73 value="deseq2_output.tabular"/> | |
74 <param name="annotation" | |
75 value="annotation.gtf"/> | |
76 <output name="output"> | |
77 <assert_contents> | |
78 <has_text_matching expression="FBgn0025111\t2192.32236942864\t2.69993841720991\t0.0979447231457099\t27.565940568266\t2.8504782974107e-167\t6.1121380892229e-164\tchrX\t10778953\t10786907\t-\tprotein_coding\tAnt2"/> | |
79 </assert_contents> | |
80 </output> | |
81 </test> | |
82 <test expect_num_outputs="1"> | |
83 <param name="input_table" | |
84 value="dexseq_output.tabular"/> | |
85 <param name="annotation" | |
86 value="annotation.gtf"/> | |
87 <param name="mode" | |
88 value="dexseq"/> | |
89 <output name="output"> | |
90 <assert_contents> | |
91 <has_text_matching expression="FBgn0025111\+FBgn0003360:E005\tFBgn0025111\+FBgn0003360\tE005\t0.273966640920426\t6.62572321505791\t0.774068626605711\t0.378961325638675\tNA\t0.41523701984849\t1.17020080867011\t2.99101950917789\tchrX\t10780596\t10780661\t66\t-\t10\t0\t0\t0\t0\t0\t2\tFBtr0073425, FBtr0333963\tprotein_coding\+protein_coding\tAnt2\+sesB\tFBtr0073425:1,FBtr0333963:1"/> | |
92 </assert_contents> | |
93 </output> | |
94 </test> | |
95 </tests> | |
96 | |
97 <help> | |
98 <![CDATA[ | |
99 | |
100 **What it does** | |
101 | |
102 This tool appends the output table of DESeq2 or DEXSeq with gene symbols, biotypes, positions etc. The information | |
103 you want to add is configurable. This information should present in the input GTF/GFF file as attributes of feature | |
104 you choose. | |
105 DEXSeq-Count tool is used to prepare the DEXSeq compatible annotation (flattened GTF file) from input GTF/GFF. In | |
106 this process, the exons that appear multiple times, once for each transcript are collapsed to so called | |
107 *exon counting bins*. Counting bins for parts of exons arise when an exonic region appears with different | |
108 boundaries in different transcripts. The resulting flattened GTF file contains pseudo exon ids per gene instead | |
109 of per transcript. This tool maps the DEXSeq couting bins back to the original exon ids. This mapping is only | |
110 possible if the input GTF/GFF file contains transcript identifier attribute for the chosen features type. | |
111 | |
112 **Inputs** | |
113 | |
114 **Differential gene expression tables** | |
115 At the moment, this tool supports DESeq2 and DEXSeq tool outputs. | |
116 | |
117 **Annotation** | |
118 Annotation file ne GTF or GFF3 format that was used for counting. | |
119 | |
120 **Outputs** | |
121 Input tabular file and with chosen attributes appended as additional columns. | |
122 | |
123 ]]> | |
124 </help> | |
125 </tool> |