fuma: fuma.xml comparison

comparison fuma.xml @ 2:86526900cb8f draft

planemo upload for repository https://github.com/ErasmusMC-Bioinformatics/fuma_galaxy_wrapper commit 3da3fcc0204205d4899763f9fe63edf9aa16d5a2

author	yhoogstrate
date	Mon, 12 Oct 2015 04:17:07 -0400
parents	54ce44828e1b
children	4966079d474b

comparison

equal deleted inserted replaced

-:54ce44828e1b
+:86526900cb8f
 <?xml version="1.0" encoding="UTF-8"?>
-<tool id="fuma" name="FuMa" version="2.7.1.b">
+<tool id="fuma" name="FuMa" version="2.10.0.a">
-	<description>FuMa (FusionMatcher) matches detected fusion genes based on gene name subset matching (designed in particular for RNA-Seq).</description>
+<description>match detected fusion genes based on gene names (in particular for RNA-Seq).</description>
-	<requirements>
+<requirements>
-		<requirement type="package" version="2.7.1">fuma</requirement>
+<requirement type="package" version="2.7">python</requirement>
-	</requirements>
+<requirement type="package" version="2.10.0">fuma</requirement>
+</requirements>
-	<version_command>fuma --version 2>&amp;1 | head -n 1</version_command><!-- -V also works, but is not GNU standard -->
+<version_command>fuma --version 2>&amp;1 | head -n 1</version_command><!-- -V also works, but is not GNU standard -->
-	<command>
-		#import pipes
+<command><![CDATA[
+#import pipes
-		#set $gene_annotations = []
-		#set $samples = []
+#set $gene_annotations = []
-		#set $links = []
+#set $samples = []
+#set $links = []
-		#for $i, $d in enumerate( $datasets )
+#for $i, $d in enumerate( $datasets )
-			#set $sample_name = pipes.quote(str($d['sample'].name))
+#set $sample_name = pipes.quote(str($d['sample'].name))
-			#set $gene_annotations = $gene_annotations + [ "ga_" + str($i) + ":" + str($d['gene_annotation'].file_name) ]
+#set $gene_annotations = $gene_annotations + [ "ga_" + str($i) + ":" + str($d['gene_annotation'].file_name) ]
-			#set $samples = $samples + [ $sample_name + ":" + str($d['format']) + ":" + str($d['sample'].file_name) ]
+#set $samples = $samples + [ $sample_name + ":" + str($d['format']) + ":" + str($d['sample'].file_name) ]
-			#set $links = $links + [ $sample_name + ":" + str("ga_") + str($i) ]
+#set $links = $links + [ $sample_name + ":" + str("ga_") + str($i) ]
-		#end for
+#end for
-		#set $gene_annotations_str = " ".join(gene_annotations)
+#set $gene_annotations_str = " ".join(gene_annotations)
-		#set $samples_str = " ".join(samples)
+#set $samples_str = " ".join(samples)
-		#set $links_str = " ".join(links)
+#set $links_str = " ".join(links)
-		fuma
+fuma
-		  -a
+-m
-		    $gene_annotations_str
+$params.matching_method
-		  -s
-		    $samples_str
+$params.strand_specific_matching
-		  -l
+$params.acceptor_donor_order_specific_matchig
-		    $links_str
-		#if $output_format.value == "list_boolean"
+-a
-		  -f list
+$gene_annotations_str
-		#else
+-s
-		  -f $output_format.value
+$samples_str
-		#end if
+-l
-		  -o $fuma_overview ;
+$links_str
+#if $params.output_format.value == "list_boolean"
+-f list
+#else
-		#if $output_format.value == "list_boolean"
+-f $params.output_format.value
-			fuma-list-to-boolean-list -o tmp.txt $fuma_overview &amp;&amp;
+#end if
-			mv tmp.txt $fuma_overview
+-o $fuma_overview ;
-		#end if
-	</command>
+#if $params.output_format.value == "list_boolean"
-	<inputs>
+fuma-list-to-boolean-list -o tmp.txt $fuma_overview ;
-		<repeat name="datasets" title="FusionGene Datasets" min="2">
+mv tmp.txt $fuma_overview
-			<param name="sample" type="data" format="txt,tabular" label="Dataset (RNA-Seq fusion gene detection experiment)" />
+#end if
-			<param name="format" type="select" label="Format of dataset">
+]]></command>
-				<option value="chimerascan">ChimeraScan</option>
-				<option value="defuse">DeFuse</option>
+<inputs>
-				<option value="complete-genomics">Complete Genomics</option>
+<repeat name="datasets" title="FusionGene Datasets" min="2">
-				<option value="fusion-catcher_final">Fusion Catcher (final-list file)</option>
+<param name="sample" type="data" format="txt,tabular" label="Dataset (RNA-Seq fusion gene detection experiment)" />
-				<option value="fusionmap">FusionMap</option>
+<param name="format" type="select" label="Format of dataset">
-				<option value="trinity-gmap">GMAP (As step after Trinity)</option>
+<option value="chimera">Chimera prettyPrint()</option>
-				<option value="oncofuse">OncoFuse</option>
+<option value="chimerascan">ChimeraScan</option>
-				<option value="rna-star_chimeric">STAR (chimeric file)</option>
+<option value="defuse">DeFuse</option>
-				<option value="tophat-fusion_pre">Tophat Fusion Pre (fusions.out)</option>
+<option value="complete-genomics">Complete Genomics var/mastervar</option>
-				<option value="tophat-fusion_post_potential_fusion">Tophat Fusion Post (potential_fusion.txt)</option>
+<option value="fusion-catcher_final">Fusion Catcher (final-list file)</option>
-				<option value="tophat-fusion_post_result">Tophat Fusion Post (result.txt)</option>
+<option value="fusionmap">FusionMap</option>
-			</param>
+<option value="trinity-gmap">GMAP (As step after Trinity)</option>
-			<param name="gene_annotation" type="data" format="bed" label="Corresponding gene-name annotation file (BED format)" help="Make use of persistent gene annotations! Gene annotations should only be different if different reference genome builds were used." />
+<option value="oncofuse">OncoFuse</option>
-		</repeat>
+<option value="rna-star_chimeric">STAR (chimeric file)</option>
+<option value="star-fusion_final">STAR-Fusion (candidates.final)</option>
-		<param name="output_format" type="select" label="Output format">
+<option value="tophat-fusion_pre">Tophat Fusion Pre (fusions.out)</option>
-			<option value="list_boolean" selected="true">List (Boolean)</option>
+<option value="tophat-fusion_post_potential_fusion">Tophat Fusion Post (potential_fusion.txt)</option>
-			<option value="list">List</option>
+<option value="tophat-fusion_post_result">Tophat Fusion Post (result.txt)</option>
-			<option value="summary">Count summary</option>
+<option value="tophat-fusion_post_result_html">Tophat Fusion Post (result.html)</option>
-		</param>
+</param>
-	</inputs>
+<param name="gene_annotation" type="data" format="bed" label="Corresponding gene-name annotation file (BED format)" help="Make use of persistent gene annotations! Gene annotations should only be different if different reference genome builds were used." />
+</repeat>
-	<outputs>
-		<data format="tabular" name="fuma_overview" label="${tool.name} on ${', '.join([ str(d['sample'].hid)+': '+d['sample'].name for d in $datasets ])}" />
+<conditional name="params">
-	</outputs>
+<param name="settingsType" type="select" label="Settings to use" help="You can use the default settings or set custom values for any FuMa parameter.">
+<option value="preSet" selected="true">Use Defaults</option>
-	<tests>
+<option value="full">Full parameter list</option>
-		<test>
+</param>
-			<!-- <repeat name="datasets"> -->
+<when value="preSet">
-				<param name="datasets_0|sample" value="chimerascan.txt" ftype="tabular" />
+<param name="strand_specific_matching" type="hidden" value="--strand-specific-matching" />
-				<param name="datasets_0|format" value="chimerascan" />
+<param name="acceptor_donor_order_specific_matchig" type="hidden" value="--acceptor-donor-order-specific-matching" />
-				<param name="datasets_0|gene_annotation" value="refseq_genes_hg19.bed" ftype="bed" />
+</when>
-			<!-- </repeat> -->
+<when value="full">
-			<!-- <repeat name="datasets"> -->
+<param name="matching_method" type="select" label="Matching method: technique used to match fusion genes based on annotated gene sets" help="Overlap is the most sensitive but also more sensitive for long gene artefacts; subset is the recommended technique and EGM is conservative.">
-				<param name="datasets_1|sample" value="defuse.txt" ftype="tabular" />
+<option value="overlap">Overlap</option>
-				<param name="datasets_1|format" value="defuse" />
+<option value="subset" selected="True">Subset</option>
-				<param name="datasets_1|gene_annotation" value="refseq_genes_hg19.bed" ftype="bed" />
+<option value="egm">Exact Geneset Matching (EGM)</option>
-			<!-- </repeat> -->
+</param>
-			<!-- <repeat name="datasets"> -->
-				<param name="datasets_2|sample" value="fusion-map.txt" ftype="tabular" />
+<param name="strand_specific_matching" type="boolean" checked="True" truevalue="--strand-specific-matching" falsevalue="" label="Consider fusion genes distinct when the breakpoints have different strands" help="Only a limited number of file formats support this feature." />
-				<param name="datasets_2|format" value="fusionmap" />
+<param name="acceptor_donor_order_specific_matchig" type="boolean" checked="True" truevalue="--acceptor-donor-order-specific-matching" falsevalue="" label="Consider fusion genes distinct when the donor and acceptor sites are swapped (A,B) != (B,A)" help="This settings is not recommended when fusion genes detected in DNA-Seq are used" />
-				<param name="datasets_2|gene_annotation" value="refseq_genes_hg19.bed" ftype="bed" />
-			<!-- </repeat> -->
+<param name="output_format" type="select" label="Output format">
-			<!-- <repeat name="datasets"> -->
+<option value="list_boolean" selected="true">List (Boolean)</option>
-				<param name="datasets_3|sample" value="edgren_tp.txt" ftype="tabular" />
+<option value="list">List</option>
-				<param name="datasets_3|format" value="fusionmap" />
+<option value="summary">Count summary</option>
-				<param name="datasets_3|gene_annotation" value="refseq_genes_hg19.bed" ftype="bed" />
+</param>
-			<!-- </repeat> -->
+</when>
+</conditional>
-			<param name="output_format" value="summary" />
+</inputs>
-			<output name="fuma_overview" file="output.txt" />
+<outputs>
-		</test>
+<data format="tabular" name="fuma_overview" label="${tool.name} on ${', '.join([ str(d['sample'].hid)+': '+d['sample'].name for d in $datasets ])}" />
-	</tests>
+</outputs>
-	<help>============
+<tests>
+<test>
+<!-- <repeat name="datasets"> -->
+<param name="datasets_0|sample" value="chimerascan.txt" ftype="tabular" />
+<param name="datasets_0|format" value="chimerascan" />
+<param name="datasets_0|gene_annotation" value="refseq_genes_hg19.bed" ftype="bed" />
+<!-- </repeat> -->
+<!-- <repeat name="datasets"> -->
+<param name="datasets_1|sample" value="defuse.txt" ftype="tabular" />
+<param name="datasets_1|format" value="defuse" />
+<param name="datasets_1|gene_annotation" value="refseq_genes_hg19.bed" ftype="bed" />
+<!-- </repeat> -->
+<!-- <repeat name="datasets"> -->
+<param name="datasets_2|sample" value="fusion-map.txt" ftype="tabular" />
+<param name="datasets_2|format" value="fusionmap" />
+<param name="datasets_2|gene_annotation" value="refseq_genes_hg19.bed" ftype="bed" />
+<!-- </repeat> -->
+<!-- <repeat name="datasets"> -->
+<param name="datasets_3|sample" value="edgren_tp.txt" ftype="tabular" />
+<param name="datasets_3|format" value="fusionmap" />
+<param name="datasets_3|gene_annotation" value="refseq_genes_hg19.bed" ftype="bed" />
+<!-- </repeat> -->
+<param name="settingsType" value="full" />
+<param name="matching_method" value="subset" />
+<param name="strand_specific_matching" value="--strand-specific-matching" />
+<param name="acceptor_donor_order_specific_matchig" value="--acceptor-donor-order-specific-matching" />
+<param name="output_format" value="list_boolean" />
+<output name="fuma_overview" file="output_test_1.txt" />
+</test>
+<test>
+<!-- <repeat name="datasets"> -->
+<param name="datasets_0|sample" value="chimerascan.txt" ftype="tabular" />
+<param name="datasets_0|format" value="chimerascan" />
+<param name="datasets_0|gene_annotation" value="refseq_genes_hg19.bed" ftype="bed" />
+<!-- </repeat> -->
+<!-- <repeat name="datasets"> -->
+<param name="datasets_1|sample" value="defuse.txt" ftype="tabular" />
+<param name="datasets_1|format" value="defuse" />
+<param name="datasets_1|gene_annotation" value="refseq_genes_hg19.bed" ftype="bed" />
+<!-- </repeat> -->
+<!-- <repeat name="datasets"> -->
+<param name="datasets_2|sample" value="fusion-map.txt" ftype="tabular" />
+<param name="datasets_2|format" value="fusionmap" />
+<param name="datasets_2|gene_annotation" value="refseq_genes_hg19.bed" ftype="bed" />
+<!-- </repeat> -->
+<!-- <repeat name="datasets"> -->
+<param name="datasets_3|sample" value="edgren_tp.txt" ftype="tabular" />
+<param name="datasets_3|format" value="fusionmap" />
+<param name="datasets_3|gene_annotation" value="refseq_genes_hg19.bed" ftype="bed" />
+<!-- </repeat> -->
+<param name="settingsType" value="full" />
+<param name="matching_method" value="subset" />
+<param name="strand_specific_matching" value="" />
+<param name="acceptor_donor_order_specific_matchig" value="" />
+<param name="output_format" value="list_boolean" />
+<output name="fuma_overview" file="output_test_2.txt" />
+</test>
+</tests>
+<help><![CDATA[
+============
 Introduction
 ============
 FuMa (Fusion Matcher) matches predicted fusion events (both genomic and transcriptomic) according to chromosomal location or associated gene annotation(s), where the latter should be independent of the genome build.
 *******
 +-------------------+-----------------------+-------------------------------------+
 |Tools              | File                  | Format string                       |
 +===================+=======================+=====================================+
+|Chimera            | prettyPrint() output  | chimera                             |
++-------------------+-----------------------+-------------------------------------+
 |ChimeraScan        | chimeras.bedpe        | chimerascan                         |
 +-------------------+-----------------------+-------------------------------------+
 |Complete Genomics  | highConfidenceJu*.tsv | complete-genomics                   |
 +-------------------+-----------------------+-------------------------------------+
 |Complete Genomics  | allJunctionsBeta*.tsv | complete-genomics                   |
 +-------------------+-----------------------+-------------------------------------+
 |OncoFuse           |                       | oncofuse                            |
 +-------------------+-----------------------+-------------------------------------+
 |RNA STAR           | Chimeric.out.junction | rna-star_chimeric                   |
 +-------------------+-----------------------+-------------------------------------+
+|STAR Fusion        | _candidates.final     | star-fusion_final                   |
++-------------------+-----------------------+-------------------------------------+
 |TopHat Fusion pre  | fusions.out           | tophat-fusion_pre                   |
 +-------------------+-----------------------+-------------------------------------+
 |TopHat Fusion post | potential_fusion.txt  | tophat-fusion_post_potential_fusion |
 +-------------------+-----------------------+-------------------------------------+
 |TopHat Fusion post | result.txt            | tophat-fusion_post_result           |
 +-------------------+-----------------------+-------------------------------------+
+|TopHat Fusion post | result.html           | tophat-fusion_post_result_html      |
++-------------------+-----------------------+-------------------------------------+
 To annotate genes upon the breakpoints you must provide a BED file that contains gene annotations for the genome build used. Make sure **your BED file contains one gene per line**. You should use BED files that contain one exon per line only if you want to restrict your analysis to fusion genes detected within exons.
 UCSC genome browser provides a very simple way of obtaining BED files with one gene per line by selecting their *RefSeq Genes*-track and *knownGene*-table and putting the export format to BED. Galaxy should have a built-in UCSC table browser.
-	</help>
+]]></help>
-	<citations>
+<citations>
-	</citations>
+<citation type="bibtex">
+@unpublished{fuma,
+author       = {Youri Hoogstrate},
+title        = {FuMa: reporting overlap in RNA-seq detected fusion genes},
+url          = { https://github.com/yhoogstrate/fuma }
+}
+</citation>
+</citations>
 </tool>

Mercurial > repos > yhoogstrate > fuma

comparison fuma.xml @ 2:86526900cb8f draft