retrieve_ensembl_bed: retrieve_ensembl

comparison retrieve_ensembl_bed.xml @ 1:9c4a48f5d4e7 draft default tip

"planemo upload for repository https://github.com/galaxyproteomics/tools-galaxyp/tree/master/tools/proteogenomics/retrieve_ensembl_bed commit 6babd357845126292cb202aaea0f70ff68819525"

author	galaxyp
date	Mon, 07 Oct 2019 16:14:39 -0400
parents	da1b538b87e5
children

comparison

equal deleted inserted replaced

-:da1b538b87e5
+:9c4a48f5d4e7
 --biotypes '$biotypes'
 #end if
 #if $regions:
 --regions '$regions'
 #end if
+#if $interval_file:
+#if $interval_file.ext.find('bed') > -1
+--interval_format bed
+#elif $interval_file.ext in ['gff','gtf','gff3']
+--interval_format gff
+#else
+--interval_format interval
+#end if
+--interval_file '$interval_file'
+#end if
 '$transcript_bed'
 ]]></command>
 <inputs>
 <param name="species" type="text" value="" label="Ensembl species" >
 <help>
 </param>
 <param name="regions" type="text" value="" optional="true" label="Restrict Feature retrieval to comma-separated list of regions" >
 <help>Each region is specified as: chr or chr:pos or chr:from-to</help>
 <validator type="regex" message="">^(\w+(:\d+(-\d+)?)?(,\w+(:\d+(-\d+)?)?)*)?$</validator>
 </param>
+<param name="interval_file" type="data" format="bed,gff,interval" label="Retrieve the intervals from this file" optional="true"/>
 </inputs>
 <outputs>
 <data name="transcript_bed" format="bed" label="Ensembl ${species} transcripts.bed">
 <actions>
 <action name="column_names" type="metadata"
 <assert_contents>
 <has_text_matching expression="(chr)?1\t\d+\t\d+\tENST" />
 </assert_contents>
 </output>
 </test>
+<test>
+<param name="species" value="mouse"/>
+<param name="biotypes" value="protein_coding"/>
+<param name="interval_file" ftype="bed" value="test.bed"/>
+<output name="transcript_bed">
+<assert_contents>
+<has_text_matching expression="(chr)?1\t\d+\t\d+\tENSMUST" />
+</assert_contents>
+</output>
+</test>
 </tests>
 <help><![CDATA[
 Retrieve Ensembl cDNAs in BED format
 usage: retrieve_ensembl_bed.py [-h] [-s SPECIES] [-R REGIONS]
 [-i INTERVAL_FILE] [-f {bed,gff,interval}] [-B BIOTYPES]
 [-X] [-U] [-t] [-v] [-d]
 output
 positional arguments:
-output                Output BED filepath, or for stdout: "-"
+output                   Output BED filepath, or for stdout: "-"
 optional arguments:
--h, --help            show this help message and exit
+-h, --help               show this help message and exit
 -s SPECIES, --species SPECIES
 Ensembl Species to retrieve
 -R REGIONS, --regions REGIONS
-Restrict Ensembl retrieval to regions e.g.:
+Restrict Ensembl retrieval to regions e.g.
 X,2:20000-25000,3:100-500+
+-i INTERVAL_FILE, --interval_file INTERVAL_FILE
+Regions from a bed, gff, or interval file
+-f {bed,gff,interval}, --interval_format {bed,gff,interval}
+Interval format has TAB-separated
+columns: Seq, Start, End, Strand
 -B BIOTYPES, --biotypes BIOTYPES
 Restrict Ensembl biotypes to retrieve
--X, --extended_bed    Include the extended columns returned from Ensembl
+-X, --extended_bed       Include the extended columns returned from Ensembl
 -U, --ucsc_chrom_names
 Use the UCSC names for Chromosomes
--t, --toplevel        Print Ensembl toplevel for species
+-t, --toplevel           Print Ensembl toplevel for species
--v, --verbose         Verbose
+-v, --verbose            Verbose
--d, --debug           Debug
+-d, --debug              Debug
+**Output**
 Ensembl REST API returns an extended BED format with these additional columns::
 second_name, cds_start_status, cds_end_status, exon_frames, type, gene_name, second_gene_name, gene_type

Mercurial > repos > galaxyp > retrieve_ensembl_bed

comparison retrieve_ensembl_bed.xml @ 1:9c4a48f5d4e7 draft default tip