comparison edger-repenrich.xml @ 0:4905a332a094 draft

planemo upload for repository https://github.com/ARTbio/tools-artbio/tree/main/tools/repenrich2 commit 73721d980c1f422dc880d80f61e44d270992e537
author artbio
date Sat, 20 Apr 2024 11:56:53 +0000
parents
children
comparison
equal deleted inserted replaced
-1:000000000000 0:4905a332a094
1 <tool id="edger-repenrich2" name="edgeR-repenrich" version="@TOOL_VERSION@+galaxy@VERSION_SUFFIX@" profile="@PROFILE@">
2 <description>Determines differentially expressed features from RepEnrich2 counts</description>
3 <macros>
4 <import>macros.xml</import>
5 </macros>
6 <expand macro="edgeR_requirements"/>
7 <stdio>
8 <regex match="Execution halted"
9 source="both"
10 level="fatal"
11 description="Execution halted." />
12 <regex match="Error in"
13 source="both"
14 level="fatal"
15 description="An undefined error occurred, please check your input carefully and contact your administrator." />
16 <regex match="Fatal error"
17 source="both"
18 level="fatal"
19 description="An undefined error occurred, please check your input carefully and contact your administrator." />
20 </stdio>
21 <version_command>
22 <![CDATA[
23 echo $(R --version | grep version | grep -v GNU)", edgeR version" $(R --vanilla --slave -e "library(edgeR) &&
24 cat(sessionInfo()\$otherPkgs\$edgeR\$Version)" 2> /dev/null | grep -v -i "WARNING: ")
25 ]]>
26 </version_command>
27 <command>
28 <![CDATA[
29 #import json
30 Rscript '${__tool_directory__}/edgeR_repenrich.R'
31 --factorName '$factorName'
32
33 --levelNameA '$factorLevel_A'
34 #set $factorlevelsA = list()
35 #for $file in $countsFiles_A:
36 $factorlevelsA.append(str($file))
37 #end for
38 $factorlevelsA.reverse()
39 --levelAfiles '#echo json.dumps(factorlevelsA)#'
40
41 --levelNameB '$factorLevel_B'
42 #set $factorlevelsB = list()
43 #for $file in $countsFiles_B:
44 $factorlevelsB.append(str($file))
45 #end for
46 $factorlevelsB.reverse()
47 --levelBfiles '#echo json.dumps(factorlevelsB)#'
48
49 -o 'edger_out'
50
51 -p '$plots'
52 #if $normCounts:
53 -n '$counts_out'
54 #end if
55 -o '$edger_out'
56 ]]>
57 </command>
58 <inputs>
59 <param name="factorName" type="text" value="FactorName" label="Specify a factor name, e.g. genotype or age or drug_x"
60 help="Only letters, numbers and underscores will be retained in this field">
61 <sanitizer>
62 <valid initial="string.letters,string.digits"><add value="_" /></valid>
63 </sanitizer>
64 </param>
65 <param name="factorLevel_A" type="text" value="FactorLevel1" label="Specify a factor level, typical values could be 'mutant' or 'Drug_X'"
66 help="Only letters, numbers and underscores will be retained in this field">
67 <sanitizer>
68 <valid initial="string.letters,string.digits"><add value="_" /></valid>
69 </sanitizer>
70 </param>
71 <param name="countsFiles_A" type="data" format="tabular" multiple="true" label="Counts file(s)" help="Count files must have been generated by repenrich" />
72 <param name="factorLevel_B" type="text" value="FactorLevel2" label="Specify a factor level, typical values could be 'wildtype' or 'control'"
73 help="Only letters, numbers and underscores will be retained in this field">
74 <sanitizer>
75 <valid initial="string.letters,string.digits"><add value="_" /></valid>
76 </sanitizer>
77 </param>
78 <param name="countsFiles_B" type="data" format="tabular" multiple="true" label="Counts file(s)" help="Count files must have been generated by repenrich tool" />
79 <param name="normCounts" type="boolean" truevalue="1" falsevalue="0" checked="false"
80 label="Output normalized counts table" />
81 </inputs>
82 <outputs>
83 <data format="tabular" name="edger_out" label="edgeR: ${factorLevel_A} compared to ${factorLevel_B}">
84 <actions>
85 <action name="column_names" type="metadata" default="Tag,log2(FC),FDR,Class,Type" />
86 </actions>
87 </data>
88 <data format="pdf" name="plots" label="edgeR plots" />
89 <data format="tabular" name="counts_out" label="Normalized counts file">
90 <filter>normCounts == True</filter>
91 </data>
92 </outputs>
93 <tests>
94 <test expect_num_outputs="3">
95 <param name="factorName" value="Genotype"/>
96 <param name="factorLevel_A" value="Mutant"/>
97 <param name="countsFiles_A" value="355_fraction_counts.tab,356_fraction_counts.tab"/>
98 <param name="factorLevel_B" value="Wildtype"/>
99 <param name="countsFiles_B" value="353_fraction_counts.tab,354_fraction_counts.tab"/>
100 <param name="normCounts" value="True"/>
101 <output name="counts_out" file="Normalized_counts_file.tab"/>
102 <output name="plots" file="edgeR_plots.pdf"/>
103 <output name="edger_out" file="edgeR_result_file.tab"/>
104
105 </test>
106 </tests>
107 <help>
108 <![CDATA[
109 .. class:: infomark
110
111 **What it does**
112
113 Estimate Distance between samples (MDS) and Biological Coefficient Variation (BCV) in count
114 data from high-throughput sequencing assays and test for differential expression using edgeR_.
115
116 **Inputs**
117
118 edger-repenrich takes count tables generated by repenrich as inputs. A repenrich count table looks
119 like:
120
121 ============== ========== ========== ==========
122 LSU-rRNA_Dme rRNA rRNA 3659329
123 -------------- ---------- ---------- ----------
124 FW3_DM LINE Jockey 831
125 -------------- ---------- ---------- ----------
126 DMTOM1_LTR LTR Gypsy 1004
127 -------------- ---------- ---------- ----------
128 R1_DM LINE R1 7343
129 -------------- ---------- ---------- ----------
130 TAHRE LINE Jockey 4560
131 -------------- ---------- ---------- ----------
132 G4_DM LINE Jockey 3668
133 -------------- ---------- ---------- ----------
134 BS LINE Jockey 7296
135 -------------- ---------- ---------- ----------
136 Stalker2_I-int LTR Gypsy 12252
137 -------------- ---------- ---------- ----------
138 Stalker3_LTR LTR Gypsy 593
139 -------------- ---------- ---------- ----------
140 TABOR_I-int LTR Gypsy 3947
141 -------------- ---------- ---------- ----------
142 G7_DM LINE Jockey 162
143 -------------- ---------- ---------- ----------
144 BEL_I-int LTR Pao 23757
145 -------------- ---------- ---------- ----------
146 Gypsy6_I-int LTR Gypsy 7489
147 ============== ========== ========== ==========
148
149 Count tables must be generated for each sample individually. Here, edgeR_ is handling a
150 single factor (genotype, age, treatment, etc) that effect your experiment. This factor has
151 two levels/states (for instance, "wild-type" and "mutant". You need to select appropriate
152 count table from your history for each factor level.
153
154 The following table gives some examples of factors and their levels:
155
156 ========= ============== ===============
157 Factor Factorlevel1 Factorlevel2
158 --------- -------------- ---------------
159 Treatment Treated Untreated
160 --------- -------------- ---------------
161 Genotype Knockdown Wildtype
162 --------- -------------- ---------------
163 TimePoint Day4 Day1
164 --------- -------------- ---------------
165 Gender Female Male
166 ========= ============== ===============
167
168 *Note*: Output log2 fold changes are based on primary factor level 1 vs. factor level2.
169 Here the order of factor levels is important. For example, for the factor 'Treatment' given
170 in above table, edgeR computes fold changes of 'Treated' samples against 'Untreated',
171 i.e. the values correspond to up or down regulations of genes in Treated samples.
172
173 **Output**
174
175 edgeR_ generates a tabular file containing the different columns and results visualized in
176 a PDF:
177
178 ====== =============================================================================
179 Column Description
180 ------ -----------------------------------------------------------------------------
181 1 Tag (transposon element ID)
182 2 the logarithm (to basis 2) of the fold change (See the note in inputs section)
183 3 p value adjusted for multiple testing with the Benjamini-Hochberg procedure
184 which controls false discovery rate (FDR)
185 4 Class the transposon belongs to
186 5 Type the transposon belongs to
187 ====== =============================================================================
188
189 .. _edgeR: http://www.bioconductor.org/packages/release/bioc/html/edgeR.html
190 ]]>
191
192 **Note**: This edgeR_ wrapper was adapted from code available at
193 https://github.com/nskvir/RepEnrich
194
195 </help>
196 <citations>
197 <citation type="doi">10.1093/bioinformatics/btp616</citation>
198 </citations>
199 </tool>