comparison rcas.xml @ 1:7c7a2a381dfe draft default tip

planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/rna_tools/rcas/ commit 5c6486dead878a8c9521e1d6d50b3a537a2ec2b0
author rnateam
date Thu, 21 Jun 2018 15:07:13 -0400
parents aa9579837a2e
children
comparison
equal deleted inserted replaced
0:aa9579837a2e 1:7c7a2a381dfe
1 <?xml version="1.0" encoding="UTF-8"?> 1 <tool id="rcas" name="RCAS" version="1.5.4">
2 <tool id="rcas" name="RNA Centric Annotation System" version="1.1.1"> 2 <description>- RNA Centric Annotation System</description>
3 <requirements> 3 <requirements>
4 <requirement type="package" version="1.1.1">bioconductor-rcas</requirement> 4 <requirement type="package" version="1.5.4">bioconductor-rcas</requirement>
5 </requirements> 5 </requirements>
6 <stdio> 6 <stdio>
7 <regex match="Execution halted" source="both" level="fatal" description="Execution halted." /> 7 <regex match="Execution halted" source="both" level="fatal" description="Execution halted." />
8 <exit_code range="1:" /> 8 <exit_code range="1:" />
9 </stdio> 9 </stdio>
10 <command><![CDATA[Rscript '$script_file' 10 <command><![CDATA[
11 11 cat '$script_file' &&
12 && 12 #if $analysis_type.analysis_type_selector == 'single_set_analysis':
13 mv *RCAS.report.html RCAS.report.html 13 Rscript '$script_file' &&
14 14 mv *RCAS.report.html RCAS.report.html
15 15 #if $run_annot == "TRUE":
16 #if $run_anot == "TRUE": 16 &&
17 && 17 mv Figure*summarizeQueryRegions.data.tsv summarizeQueryRegions.data.tsv &&
18 mv Figure*summarizeQueryRegions.data.tsv summarizeQueryRegions.data.tsv && 18 mv Figure*query_gene_types.data.tsv query_gene_types.data.tsv &&
19 mv Figure*query_gene_types.data.tsv query_gene_types.data.tsv && 19 mv Figure*transcriptBoundaryCoverage.fiveprime.data.tsv transcriptBoundaryCoverage.fiveprime.data.tsv &&
20 mv Figure*transcriptBoundaryCoverage.fiveprime.data.tsv transcriptBoundaryCoverage.fiveprime.data.tsv && 20 mv Figure*transcriptBoundaryCoverage.threeprime.data.tsv transcriptBoundaryCoverage.threeprime.data.tsv &&
21 mv Figure*transcriptBoundaryCoverage.threeprime.data.tsv transcriptBoundaryCoverage.threeprime.data.tsv && 21 mv Figure*exonIntronBoundaryCoverage.fiveprime.data.tsv exonIntronBoundaryCoverage.fiveprime.data.tsv &&
22 mv Figure*exonIntronBoundaryCoverage.fiveprime.data.tsv exonIntronBoundaryCoverage.fiveprime.data.tsv && 22 mv Figure*exonIntronBoundaryCoverage.threeprime.data.tsv exonIntronBoundaryCoverage.threeprime.data.tsv &&
23 mv Figure*exonIntronBoundaryCoverage.threeprime.data.tsv exonIntronBoundaryCoverage.threeprime.data.tsv && 23 mv Figure*coverageprofilelist.data.tsv coverageprofilelist.data.tsv &&
24 mv Figure*coverageprofilelist.data.tsv coverageprofilelist.data.tsv && 24 mv Table*getTargetedGenesTable.data.tsv getTargetedGenesTable.data.tsv
25 mv Table*getTargetedGenesTable.data.tsv getTargetedGenesTable.data.tsv 25 #end if
26 #if $analysis_type.run_go == "TRUE":
27 &&
28 mv Table*goBP.data.tsv goBP.data.tsv &&
29 mv Table*goMF.data.tsv goMF.data.tsv &&
30 mv Table*goCC.data.tsv goCC.data.tsv
31 #end if
32
33 #if $analysis_type.gsea_set.run_gsea == "TRUE":
34 &&
35 mv Table*GSEA.data.tsv GSEA.data.tsv
36 #end if
37 #else:
38 Rscript '$script_file'
26 #end if 39 #end if
27 40 ]]></command>
28 41 <configfiles>
29 #if $run_GOrich == "TRUE": 42 <configfile name="script_file"><![CDATA[
30 && 43 #import re
31 mv Table*goBP.data.tsv goBP.data.tsv && 44 library("RCAS")
32 mv Table*goMF.data.tsv goMF.data.tsv && 45 #if $analysis_type.analysis_type_selector == 'single_set_analysis':
33 mv Table*goCC.data.tsv goCC.data.tsv 46 runReport(queryFilePath = '${analysis_type.single_bed_file}',
47 gffFilePath = '${input_gtf_file}',
48 genomeVersion = '${genome_version}',
49 #if $analysis_type.run_go
50 goAnalysis = TRUE,
51 #end if
52 #if $analysis_type.gsea_set.run_gsea
53 msigdbAnalysis = TRUE,
54 msigdbFilePath = '${$analysis_type.gsea_set.input_human_msigdb_gmt}',
55 #end if
56 sampleN = '${analysis_type.downsampling}',
57 annotationSummary = ${run_annot},
58 motifAnalysis = ${run_motif},
59 outDir = getwd(),
60 #if $analysis_type.output_raw_tables
61 printProcessedTables = TRUE,
62 #end if
63 selfContained = TRUE)
64 #elif $analysis_type.analysis_type_selector == 'multi_set_analysis':
65 library("mgcv")
66 paths <- c('#echo "','".join(map(str, $analysis_type.multi_bed_file))#')
67 #set $ids = [re.sub('[^\w\-]', '_', str($bed_file.element_identifier)) for $bed_file in $analysis_type.multi_bed_file]
68 ids <- c('#echo "','".join($ids)#')
69 projData <- data.frame('sampleName' = ids, 'bedFilePath' = paths, stringsAsFactors = FALSE)
70 projDataFile <- file.path(getwd(), 'myProjDataFile.tsv')
71 write.table(projData, projDataFile, sep = '\t', quote =FALSE, row.names = FALSE)
72 gtfFilePath = '${input_gtf_file}'
73 databasePath <- file.path(getwd(), 'myProject.sqlite')
74 invisible(createDB(dbPath = databasePath, projDataFile = projDataFile, gtfFilePath = gtfFilePath,
75 motifAnalysis = ${run_motif},
76 annotationSummary = ${run_annot},
77 genomeVersion = '${genome_version}'))
78 sampleData <- data.frame('sampleName' = ids, 'sampleGroup' = ids, stringsAsFactors = FALSE)
79 sampleDataFile <- file.path(getwd(), 'mySampleDataTable.tsv')
80 write.table(sampleData, sampleDataFile, sep = '\t', quote =FALSE, row.names = FALSE)
81 runReportMetaAnalysis(dbPath = databasePath, sampleTablePath = sampleDataFile, outFile = file.path(getwd(), 'RCAS.multi_sample_report.html'))
34 #end if 82 #end if
35 83 ]]></configfile>
36
37 #if $choice.run_PATHrich == "TRUE":
38 &&
39 mv Table*GSEA.data.tsv GSEA.data.tsv
40 #end if
41
42
43 #if $run_motif == "TRUE":
44 &&
45 mv Table*motif_analysis_table.data.tsv motif_analysis_table.data.tsv
46 #end if]]></command>
47 <configfiles>
48 <configfile name="script_file">library("RCAS")
49
50 runReport(queryFilePath = '${input_BED}',
51
52 gffFilePath = '${input_GTF}',
53
54 #if $choice.run_PATHrich == "TRUE":
55 msigdbFilePath = '${choice.input_human_msigdb_gmt}',
56 #end if
57
58 annotationSummary = ${run_anot},
59
60 goAnalysis = ${run_GOrich},
61
62 msigdbAnalysis = ${choice.run_PATHrich},
63
64 motifAnalysis = ${run_motif},
65
66 genomeVersion = '${genomeVersion}',
67
68 outDir = getwd(),
69
70 printProcessedTables = TRUE,
71
72 sampleN = '${downsampling}',
73
74 selfContained = TRUE)</configfile>
75 </configfiles> 84 </configfiles>
76 <inputs> 85 <inputs>
77 <param name="genomeVersion" type="select" label="Genome Version"> 86 <param name="genome_version" type="select" label="Genome Version">
78 <option value="hg19" selected="true">hg19</option> 87 <option value="hg19" selected="true">hg19</option>
88 <option value="hg38">hg38</option>
89 <option value="mm9">mm9</option>
90 <option value="mm10">mm10</option>
79 <option value="dm3">dm3</option> 91 <option value="dm3">dm3</option>
80 <option value="ce10">ce10</option> 92 <option value="ce10">ce10</option>
81 <option value="mm9">mm9</option>
82 </param> 93 </param>
83 <param name="input_BED" type="data" format="BED" label="Target regions in BED format" help="The coordinates should be in accord with Genome Version." /> 94
84 <param name="input_GTF" type="data" format="GTF" label="Reference annotation in ENSEMBL GTF format" /> 95 <param name="input_gtf_file" type="data" format="GTF" label="Reference annotation in ENSEMBL GTF format" />
85 <param name="run_anot" label="Run annotation." type="boolean" falsevalue="FALSE" truevalue="TRUE" checked="True" help="Use this option if you want to run annotation." /> 96
86 <param name="run_GOrich" label="Run GO term enrichment" type="boolean" falsevalue="FALSE" truevalue="TRUE" checked="False" help="Use this option if you want to run GO term enrichment (supported genome versions: hg19, mm9, dm3)." /> 97 <conditional name="analysis_type">
87 <conditional name="choice"> 98 <param name="analysis_type_selector" type="select" label="Select analysis type">
88 <param name="run_PATHrich" type="select" label="Run gene set enrichment" help="Use this option if you want to run gene set enrichment."> 99 <option value="single_set_analysis" selected="true">Single sample analysis</option>
89 <option value="FALSE" selected="True">No</option> 100 <option value="multi_set_analysis">Multi sample analysis</option>
90 <option value="TRUE">Yes</option>
91 </param> 101 </param>
92 <when value="TRUE"> 102 <!-- Single dataset analysis -->
93 <param name="input_human_msigdb_gmt" type="data" format="tabular" label="Human Molecular Signatures Database (MSigDB)" help="The database is usesd for gene set enrichment (supported genome versions: hg19, mm9, dm3). For non-human species, the human MSigDB will be automatically converted accordingly." /> 103 <when value="single_set_analysis">
104 <param name="single_bed_file" type="data" format="bed"
105 label="Single sample analysis BED file"
106 help="Genomic BED file used for single sample analysis"/>
107 <param name="run_go" label="Run GO term enrichment analysis"
108 type="boolean" falsevalue="FALSE" truevalue="TRUE" checked="False"
109 help="Run GO term enrichment analysis (supported genome versions: hg19, hg38, mm9, mm10, dm3)" />
110 <conditional name="gsea_set">
111 <param name="run_gsea" type="boolean" falsevalue="FALSE" truevalue="TRUE" checked="false" label="Run gene set enrichment analysis"/>
112 <when value="FALSE" />
113 <when value="TRUE">
114 <param name="input_human_msigdb_gmt" type="data" format="tabular"
115 label="Provide human Molecular Signatures Database (MSigDB) file"
116 help="This database file is needed for gene set enrichment analysis (supported genome versions: hg19, hg38, mm9, mm10, dm3). For non-human species, the human MSigDB will be automatically converted." />
117 </when>
118 </conditional>
119 <param name="downsampling" label="Downsampling (N)" type="text" value="0"
120 help="Randomly sample down query regions to (N). To activate sampling a positive integer value smaller than the total number of query regions should be given. Default value is 0 (i.e. no downsampling applied)" />
121 <param name="output_raw_tables" type="boolean" falsevalue="FALSE" truevalue="TRUE" value="False"
122 label="Output raw data tables"
123 help="Output single sample analysis raw data tables that are used for plots/tables as text files"/>
94 </when> 124 </when>
95 <when value="FALSE" /> 125 <!-- Multiple datasets meta analysis -->
126 <when value="multi_set_analysis">
127 <param name="multi_bed_file" type="data" format="bed"
128 label="Multi sample analysis BED files" multiple="true"
129 help="Genomic BED files used for multi sample analysis. NOTE that the dataset name inside the Galaxy history is used as identifier for each set, resulting in plots with the Galaxy dataset names corresponding to their respective input BED files."/>
130 </when>
96 </conditional> 131 </conditional>
97 <param name="run_motif" label="Run motif search" type="boolean" falsevalue="FALSE" truevalue="TRUE" checked="False" help="Use this option if you want to run motif search." /> 132
98 <param name="downsampling" label="Downsampling (N)" type="text" value="0" help="Randomly sample query regions down to (N)" /> 133 <!-- Parameters common to multi and single set analysis -->
134 <param name="run_annot" label="Output annotation summaries" type="boolean" falsevalue="FALSE" truevalue="TRUE" checked="True" help="Output annotation summaries from overlap operations" />
135 <param name="run_motif" label="Run motif analysis" type="boolean" falsevalue="FALSE" truevalue="TRUE" checked="False" help="Run motif analysis for each input dataset and each transcript region" />
99 </inputs> 136 </inputs>
100 <outputs> 137 <outputs>
101 <data name="report" format="html" from_work_dir="RCAS.report.html" label="${tool.name} on ${on_string}: dynamic HTML" /> 138 <data name="report" format="html" from_work_dir="RCAS.report.html" label="${tool.name} on ${on_string}: single sample analysis report HTML">
139 <filter>analysis_type["analysis_type_selector"] == "single_set_analysis"</filter>
140 </data>
102 <data name="summarizeQueryRegions" format="tsv" from_work_dir="summarizeQueryRegions.data.tsv" label="${tool.name} on ${on_string}: Query regions summary"> 141 <data name="summarizeQueryRegions" format="tsv" from_work_dir="summarizeQueryRegions.data.tsv" label="${tool.name} on ${on_string}: Query regions summary">
103 <filter>run_anot == True</filter> 142 <filter>run_annot is True and analysis_type["analysis_type_selector"] == "single_set_analysis" and analysis_type['output_raw_tables'] is True</filter>
104 </data> 143 </data>
105 <data name="query_gene_types" format="tsv" from_work_dir="query_gene_types.data.tsv" label="${tool.name} on ${on_string}: Query gene types"> 144 <data name="query_gene_types" format="tsv" from_work_dir="query_gene_types.data.tsv" label="${tool.name} on ${on_string}: Query gene types">
106 <filter>run_anot == True</filter> 145 <filter>run_annot is True and analysis_type["analysis_type_selector"] == "single_set_analysis" and analysis_type['output_raw_tables'] is True</filter>
107 </data> 146 </data>
108 <data name="transcriptBoundaryCoverage.fiveprime" format="tsv" from_work_dir="transcriptBoundaryCoverage.fiveprime.data.tsv" label="${tool.name} on ${on_string}: Transcript boundary coverage (5')"> 147 <data name="transcriptBoundaryCoverage.fiveprime" format="tsv" from_work_dir="transcriptBoundaryCoverage.fiveprime.data.tsv" label="${tool.name} on ${on_string}: Transcript boundary coverage (5')">
109 <filter>run_anot == True</filter> 148 <filter>run_annot is True and analysis_type["analysis_type_selector"] == "single_set_analysis" and analysis_type['output_raw_tables'] is True</filter>
110 </data> 149 </data>
111 <data name="transcriptBoundaryCoverage.threeprime" format="tsv" from_work_dir="transcriptBoundaryCoverage.threeprime.data.tsv" label="${tool.name} on ${on_string}: Transcript boundary coverage (3')"> 150 <data name="transcriptBoundaryCoverage.threeprime" format="tsv" from_work_dir="transcriptBoundaryCoverage.threeprime.data.tsv" label="${tool.name} on ${on_string}: Transcript boundary coverage (3')">
112 <filter>run_anot == True</filter> 151 <filter>run_annot is True and analysis_type["analysis_type_selector"] == "single_set_analysis" and analysis_type['output_raw_tables'] is True</filter>
113 </data> 152 </data>
114 <data name="exonIntronBoundaryCoverage.fiveprime" format="tsv" from_work_dir="exonIntronBoundaryCoverage.fiveprime.data.tsv" label="${tool.name} on ${on_string}: Exon-intron boundary coverage (5')"> 153 <data name="exonIntronBoundaryCoverage.fiveprime" format="tsv" from_work_dir="exonIntronBoundaryCoverage.fiveprime.data.tsv" label="${tool.name} on ${on_string}: Exon-intron boundary coverage (5')">
115 <filter>run_anot == True</filter> 154 <filter>run_annot is True and analysis_type["analysis_type_selector"] == "single_set_analysis" and analysis_type['output_raw_tables'] is True</filter>
116 </data> 155 </data>
117 <data name="exonIntronBoundaryCoverage.threeprime" format="tsv" from_work_dir="exonIntronBoundaryCoverage.threeprime.data.tsv" label="${tool.name} on ${on_string}: Exon-intron boundary coverage (3')"> 156 <data name="exonIntronBoundaryCoverage.threeprime" format="tsv" from_work_dir="exonIntronBoundaryCoverage.threeprime.data.tsv" label="${tool.name} on ${on_string}: Exon-intron boundary coverage (3')">
118 <filter>run_anot == True</filter> 157 <filter>run_annot is True and analysis_type["analysis_type_selector"] == "single_set_analysis" and analysis_type['output_raw_tables'] is True</filter>
119 </data> 158 </data>
120 <data name="coverageprofilelist" format="tsv" from_work_dir="coverageprofilelist.data.tsv" label="${tool.name} on ${on_string}: Coverage profile list"> 159 <data name="coverageprofilelist" format="tsv" from_work_dir="coverageprofilelist.data.tsv" label="${tool.name} on ${on_string}: Coverage profile list">
121 <filter>run_anot == True</filter> 160 <filter>run_annot is True and analysis_type["analysis_type_selector"] == "single_set_analysis" and analysis_type['output_raw_tables'] is True</filter>
122 </data> 161 </data>
123 <data name="getTargetedGenesTable" format="tsv" from_work_dir="getTargetedGenesTable.data.tsv" label="${tool.name} on ${on_string}: Targeted genes"> 162 <data name="getTargetedGenesTable" format="tsv" from_work_dir="getTargetedGenesTable.data.tsv" label="${tool.name} on ${on_string}: Targeted genes">
124 <filter>run_anot == True</filter> 163 <filter>run_annot is True and analysis_type["analysis_type_selector"] == "single_set_analysis" and analysis_type['output_raw_tables'] is True</filter>
125 </data> 164 </data>
126 <data name="goCC" format="tsv" from_work_dir="goCC.data.tsv" label="${tool.name} on ${on_string}: GO term enrichment (cellular compartments)"> 165 <data name="goCC" format="tsv" from_work_dir="goCC.data.tsv" label="${tool.name} on ${on_string}: GO term enrichment (cellular compartments)">
127 <filter>run_GOrich == True</filter> 166 <filter>analysis_type["analysis_type_selector"] == "single_set_analysis" and analysis_type['run_go'] is True and analysis_type['output_raw_tables'] is True</filter>
128 </data> 167 </data>
129 <data name="goBP" format="tsv" from_work_dir="goBP.data.tsv" label="${tool.name} on ${on_string}: GO term enrichment (biological processes)"> 168 <data name="goBP" format="tsv" from_work_dir="goBP.data.tsv" label="${tool.name} on ${on_string}: GO term enrichment (biological processes)">
130 <filter>run_GOrich == True</filter> 169 <filter>analysis_type["analysis_type_selector"] == "single_set_analysis" and analysis_type['run_go'] is True and analysis_type['output_raw_tables'] is True</filter>
131 </data> 170 </data>
132 <data name="goMF" format="tsv" from_work_dir="goMF.data.tsv" label="${tool.name} on ${on_string}: GO term enrichment (molecular functions)"> 171 <data name="goMF" format="tsv" from_work_dir="goMF.data.tsv" label="${tool.name} on ${on_string}: GO term enrichment (molecular functions)">
133 <filter>run_GOrich == True</filter> 172 <filter>analysis_type["analysis_type_selector"] == "single_set_analysis" and analysis_type['run_go'] is True and analysis_type['output_raw_tables'] is True</filter>
134 </data> 173 </data>
135 <data name="GSEA" format="tsv" from_work_dir="GSEA.data.tsv" label="${tool.name} on ${on_string}: Gene set enrichment analysis"> 174 <data name="GSEA" format="tsv" from_work_dir="GSEA.data.tsv" label="${tool.name} on ${on_string}: Gene set enrichment analysis">
136 <filter>choice['run_PATHrich'] == "TRUE"</filter> 175 <filter>analysis_type["analysis_type_selector"] == "single_set_analysis" and analysis_type['gsea_set']['run_gsea'] is True and analysis_type['output_raw_tables'] is True</filter>
137 </data> 176 </data>
138 <data name="motif" format="tsv" from_work_dir="motif_analysis_table.data.tsv" label="${tool.name} on ${on_string}: Motif"> 177 <data name="multi_report" format="html" from_work_dir="RCAS.multi_sample_report.html" label="${tool.name} on ${on_string}: multi sample analysis report HTML">
139 <filter>run_motif == True</filter> 178 <filter>analysis_type["analysis_type_selector"] == "multi_set_analysis"</filter>
140 </data> 179 </data>
141 </outputs> 180 </outputs>
142 <tests> 181 <tests>
143 <test> 182 <test>
144 <param name="input_BED" value="input.TIA1.bed" /> 183 <param name="analysis_type_selector" value="single_set_analysis"/>
145 <param name="input_GTF" value="input.Homo_sapiens.GRCh37-chr1-f10k.75.gtf" /> 184 <param name="single_bed_file" value="input.TIA1.bed"/>
146 <param name="input_human_msigdb_gmt" value="input.msigdb_test.gmt" /> 185 <param name="input_gtf_file" value="input.Homo_sapiens.GRCh37-chr1-f10k.75.gtf"/>
147 <param name="run_anot" value="TRUE" /> 186 <param name="input_human_msigdb_gmt" value="input.msigdb_test.gmt"/>
148 <param name="run_GOrich" value="TRUE" /> 187 <param name="run_annot" value="TRUE"/>
149 <param name="run_PATHrich" value="TRUE" /> 188 <param name="run_go" value="TRUE"/>
150 <param name="run_motif" value="TRUE" /> 189 <param name="run_gsea" value="TRUE"/>
151 <param name="genomeVersion" value="hg19" /> 190 <param name="run_motif" value="TRUE"/>
152 <output name="report" file="output.TIA1.bed.RCAS.report.html" ftype="html" compare="sim_size" /> 191 <param name="output_raw_tables" value="TRUE"/>
153 <output name="summarizeQueryRegions" file="summarizeQueryRegions.data.tsv" ftype="tsv" /> 192 <param name="genome_version" value="hg19" />
154 <output name="query_gene_types" file="query_gene_types.data.tsv" ftype="tsv" /> 193 <output name="report" file="input.TIA1.bed.RCAS.report.html" ftype="html" compare="sim_size"/>
155 <output name="transcriptBoundaryCoverage.fiveprime" file="transcriptBoundaryCoverage.fiveprime.data.tsv" ftype="tsv" /> 194 <output name="summarizeQueryRegions" file="summarizeQueryRegions.data.tsv" ftype="tsv"/>
156 <output name="transcriptBoundaryCoverage.threeprime" file="transcriptBoundaryCoverage.threeprime.data.tsv" ftype="tsv" /> 195 <output name="query_gene_types" file="query_gene_types.data.tsv" ftype="tsv"/>
157 <output name="exonIntronBoundaryCoverage.fiveprime" file="exonIntronBoundaryCoverage.fiveprime.data.tsv" ftype="tsv" /> 196 <output name="transcriptBoundaryCoverage.fiveprime" file="transcriptBoundaryCoverage.fiveprime.data.tsv" ftype="tsv"/>
158 <output name="exonIntronBoundaryCoverage.threeprime" file="exonIntronBoundaryCoverage.threeprime.data.tsv" ftype="tsv" /> 197 <output name="transcriptBoundaryCoverage.threeprime" file="transcriptBoundaryCoverage.threeprime.data.tsv" ftype="tsv"/>
159 <output name="coverageprofilelist" file="coverageprofilelist.data.tsv" ftype="tsv" /> 198 <output name="exonIntronBoundaryCoverage.fiveprime" file="exonIntronBoundaryCoverage.fiveprime.data.tsv" ftype="tsv"/>
160 <output name="getTargetedGenesTable" file="getTargetedGenesTable.data.tsv" ftype="tsv" /> 199 <output name="exonIntronBoundaryCoverage.threeprime" file="exonIntronBoundaryCoverage.threeprime.data.tsv" ftype="tsv"/>
200 <output name="coverageprofilelist" file="coverageprofilelist.data.tsv" ftype="tsv"/>
201 <output name="getTargetedGenesTable" file="getTargetedGenesTable.data.tsv" ftype="tsv"/>
161 <output name="goCC" file="goCC.data.tsv" ftype="tsv" compare="sim_size"/> 202 <output name="goCC" file="goCC.data.tsv" ftype="tsv" compare="sim_size"/>
162 <output name="goBP" file="goBP.data.tsv" ftype="tsv" compare="sim_size"/> 203 <output name="goBP" file="goBP.data.tsv" ftype="tsv" compare="sim_size"/>
163 <output name="goMF" file="goMF.data.tsv" ftype="tsv" compare="sim_size"/> 204 <output name="goMF" file="goMF.data.tsv" ftype="tsv" compare="sim_size"/>
164 <output name="GSEA" file="GSEA.data.tsv" ftype="tsv" /> 205 <output name="GSEA" file="GSEA.data.tsv" ftype="tsv"/>
165 <output name="motif" file="motif_analysis_table.data.tsv" ftype="tsv" compare="sim_size" /> 206 </test>
207 <test>
208 <param name="analysis_type_selector" value="multi_set_analysis"/>
209 <param name="multi_bed_file" value="EIF4A3Sauliere20121a.bed,EIF4A3Sauliere20121b.bed,FMR1_Ascano2012a_hg19.bed,FMR1_Ascano2012b_hg19.bed,FUS_Nakaya2013c_hg19.bed,FUS_Nakaya2013d_hg19.bed"/>
210 <param name="input_gtf_file" value="hg19.sample.gtf"/>
211 <param name="run_annot" value="TRUE"/>
212 <param name="run_motif" value="TRUE"/>
213 <param name="genome_version" value="hg19" />
214 <output name="multi_report" file="test2_multi_set_analysis_report.html" ftype="html" compare="sim_size" delta="20000"/>
166 </test> 215 </test>
167 </tests> 216 </tests>
168 <help><![CDATA[.. class:: infomark 217 <help><![CDATA[
169 218
170 **Purpose** 219 **Introduction**
171 220
172 RNA Centric Annotation System (RCAS) automatically generates 221 RCAS is an R/Bioconductor package designed as a generic reporting tool for the functional analysis of transcriptome-wide regions of interest detected by high-throughput experiments. Such transcriptomic regions could be, for instance, signal peaks detected by CLIP-Seq analysis for protein-RNA interaction sites, RNA modification sites (alias the epitranscriptome), CAGE-tag locations, or any other collection of query regions at the level of the transcriptome. RCAS produces in-depth annotation summaries and coverage profiles based on the distribution of the query regions with respect to transcript features (exons, introns, 5’/3’ UTR regions, exon-intron boundaries, promoter regions). Moreover, RCAS can carry out functional enrichment analyses of annotated gene sets, GO terms, and de novo motif discovery. RCAS is available in the Bioconductor repository, packaged in multiple environments including Conda, Galaxy, and Guix, and as a webservice at http://rcas.mdc-berlin.de/.
173 dynamic annotations for custom input files 222
174 that contain transcriptomic target regions. 223 Currently supported genome builds are hg19 and hg38 (human), mm9 and mm10 (mouse), dm3 (fly), and ce10 (worm). Modules for annotation summaries and motif analysis are supported for each of these genome builds. GO term and gene-set enrichment analyses are supported for hg19, hg38, mm9, mm10, and dm3. ce10 is currently not supportedfor GO/GSEA modules.
175 RCAS automatically summarizes annotated features 224
176 that overlap with targets in the BED file,
177 and perform enrichment analysis of
178 Gene Ontology (GO) terms, gene set and motifs.
179 225
180 ----- 226 -----
181 227
182 .. class:: infomark
183
184 **Inputs** 228 **Inputs**
185 229
186 1. A target region file in BED format 230 1. One (single sample analysis) or several (multi sample analysis) genomic target region files in BED format
187 2. A reference annotation file in GTF format 231 2. A genome reference annotation file in GTF format
188 3. A Human Molecular Signatures Database (MSigDB) (only needed for gene set enrichment) 232 3. A human Molecular Signatures Database (MSigDB) (only in single sample analysis for gene set enrichment analysis)
189 233
190 ----- 234 -----
191 235
192 .. class:: infomark
193
194 **Outputs** 236 **Outputs**
195 237
196 The outputs consist of a dynamic HTML file and 238 The outputs consist of a dynamic HTML file (both for single and multi sample analysis) and optionally a number (depending on selected options) of tabular files (single sample analysis only).
197 a dozen of tabular files. 239 The dynamic HTML file is composed of interactive tables and figures,
198 The dynamic HTML file is composed of the interactive tables and figures,
199 which can be downloaded and viewed with a web browser. 240 which can be downloaded and viewed with a web browser.
200 241
201 The tabular files correspond to the respective figures in the HTML file, 242 The tabular files contain the RCAS analysis results, corresponding to the
202 which are the results 243 respective figures in the HTML file:
203 of different RCAS analysis, as following:
204 244
205 1. Annotation summary for query regions 245 1. Annotation summary for query regions
206 246
207 * Query regions summary 247 * Query regions summary
208 * Query gene types 248 * Query gene types
219 * GO term enrichment (biological processes) 259 * GO term enrichment (biological processes)
220 * GO term enrichment (molecular functions) 260 * GO term enrichment (molecular functions)
221 261
222 3. Gene set enrichment analysis results 262 3. Gene set enrichment analysis results
223 263
224 4. Motif analysis results]]></help> 264 4. Motif analysis results (no table output in 1.5.4.)
265
266 ]]></help>
225 <citations> 267 <citations>
226 <citation type="doi">10.1093/nar/gkx120</citation> 268 <citation type="doi">10.1093/nar/gkx120</citation>
227 </citations> 269 </citations>
228 </tool> 270 </tool>