Mercurial > repos > crs4 > edge_pro
diff edge_pro.xml @ 0:7af33315bc5e draft
Uploaded
author | crs4 |
---|---|
date | Mon, 09 Sep 2013 06:11:47 -0400 |
parents | |
children | f77ce4f92b46 |
line wrap: on
line diff
<!--
  Galaxy tool wrapper for EDGE-pro (package requirement: edge-pro 1.3.1).
  Runs the edge_pro.py helper with a FASTA reference genome, PTT and RNT
  annotation files and single-end or paired-end FASTQ reads, and collects
  three outputs: the alignment (SAM), the RPKM table and a log file.
-->
<tool id="edge_pro" name="EDGE-pro" version="1.0.0">
  <description>Gene expression in Prokaryotes</description>
  <requirements>
    <requirement type="package" version="1.3.1">edge-pro</requirement>
  </requirements>
  <command interpreter="python">
    edge_pro.py
    ## Site-wide options hook. The backslash stops the template engine from
    ## treating the dollar sign as a placeholder, so the shell receives a
    ## parameter expansion: the content of EDGE_PRO_SITE_OPTIONS when it is
    ## set and non-empty, otherwise the default of 4 threads.
    \${EDGE_PRO_SITE_OPTIONS:---num-threads=4}

    ## Mandatory input parameters
    --genome $genome
    --ptt $ptt
    --rnt $rnt
    ## First input file always required
    --input1 $singlePaired.input1
    ## Second input only if input is paired-end
    #if $singlePaired.sPaired == "paired"
      --input2=$singlePaired.input2
    #end if

    ## Optional input parameters
    ## Each option is emitted only when its field is non-empty. The test is
    ## done on str() so that a value of 0 still counts as set (the string "0"
    ## is non-empty). NOTE(review): this relies on a blank optional field
    ## rendering as an empty string; confirm for the target Galaxy release.
    #if $params.settingsType == "full"
      #if str($params.minInsertSize)
        --minInsertSize=$params.minInsertSize
      #end if
      #if str($params.maxInsertSize)
        --maxInsertSize=$params.maxInsertSize
      #end if
      #if str($params.window)
        --window=$params.window
      #end if
      #if str($params.utrSize)
        --utrSize=$params.utrSize
      #end if
      #if str($params.similarity)
        --similarity=$params.similarity
      #end if
      #if str($params.readLength)
        --readLength=$params.readLength
      #end if
      #if str($params.minCoverage)
        --minCoverage=$params.minCoverage
      #end if
    #end if

    ## Outputs
    --out-aln $out_aln
    --out-rpkm $out_rpkm
    --out-log $out_log
  </command>
  <inputs>
    <!-- Library layout: decides whether one or two FASTQ inputs are requested. -->
    <conditional name="singlePaired">
      <param name="sPaired" type="select" label="Is this library mate-paired?">
        <option value="single">Single-end</option>
        <option value="paired">Paired-end</option>
      </param>
      <when value="single">
        <param format="fastqsanger"
               name="input1"
               type="data"
               label="FASTQ file"
               help="FASTQ format with Sanger-scaled quality values (Galaxy fastqsanger datatype)"/>
      </when>
      <when value="paired">
        <param format="fastqsanger"
               name="input1"
               type="data"
               label="Forward FASTQ file"
               help="FASTQ format with Sanger-scaled quality values (Galaxy fastqsanger datatype)" />
        <param format="fastqsanger"
               name="input2"
               type="data"
               label="Reverse FASTQ file"
               help="FASTQ format with Sanger-scaled quality values (Galaxy fastqsanger datatype)" />
      </when>
    </conditional>

    <!-- Reference genome and annotation files, always required. -->
    <param format="fasta"
           name="genome"
           type="data"
           label="Select the reference genome from your history (-g)"
           help="FASTA format" />
    <param format="ptt"
           name="ptt"
           type="data"
           label="Coordinates of coding genes (PTT file)"
           help="PTT file with coordinates of coding genes (-p)" />
    <param format="rnt"
           name="rnt"
           type="data"
           label="Coordinates of structural RNAs (RNT file)"
           help="RNT file with coordinates of structural RNA (-r)" />

    <!-- Tuning parameters: hidden unless the full parameter list is selected. -->
    <conditional name="params">
      <param name="settingsType"
             type="select"
             label="Parameter settings"
             help="For most needs, use default settings. If you want full control use Full Parameter List">
        <option value="preSet">Use Defaults</option>
        <option value="full">Full parameter list</option>
      </param>
      <when value="preSet" />
      <!-- Full/advanced params. -->
      <when value="full">
        <param name="minInsertSize"
               type="integer"
               optional="true"
               value="0"
               label="Minimum insert size for a read pair (-m)"
               help="For paired-end reads only" />
        <param name="maxInsertSize"
               type="integer"
               optional="true"
               value="500"
               label="Maximum insert size for a read pair (-M)"
               help="For paired-end reads only" />
        <param name="window"
               type="integer"
               optional="true"
               value="100"
               label="Window length for coverage distribution (-w)"
               help="Used to distribute the coverage between two overlapping genes. See help below for details" />
        <param name="utrSize"
               type="integer"
               optional="true"
               value="40"
               label="Size of the untranslated region (-i)"
               help="Enter the size of the untranslated region between the initial transcription site and the start codon" />
        <param name="similarity"
               type="float"
               optional="true"
               value="0.15"
               label="Percentage for similar coverage (-x)"
               help="Enter the percentage used to determine when two coverage values are considered similar. See help below for details" />
        <param name="readLength"
               type="integer"
               optional="true"
               value=""
               label="Read length (-l)"
               help="If not specified, the first 1000 reads are used to approximate the read length" />
        <param name="minCoverage"
               type="integer"
               optional="true"
               value="3"
               label="Minimum average coverage for expressed genes (-c)"
               help="Coverage less than specified is assumed to be noise and gene is considered to not be expressed" />
      </when> <!-- full -->
    </conditional>
  </inputs>

  <!-- One dataset per output option passed on the command line. -->
  <outputs>
    <data format="sam" name="out_aln" label="${tool.name} on ${on_string}: alignment"/>
    <data format="tabular" name="out_rpkm" label="${tool.name} on ${on_string}: rpkm"/>
    <data format="txt" name="out_log" label="${tool.name} on ${on_string}: log"/>
  </outputs>

  <help>

**What it does**

`EDGE-pro`_, Estimated Degree of Gene Expression in PROkaryotes is an efficient software system to estimate gene expression levels in prokaryotic genomes from RNA-seq data. EDGE-pro uses Bowtie2 for alignment and then estimates expression directly from the alignment results.
EDGE-pro includes routines to assign reads aligning to overlapping gene regions accurately. 15% or more of bacterial genes overlap other genes, making this a significant problem for bacterial RNA-seq, one that is generally ignored by programs designed for eukaryotic RNA-seq experiments.

**Input files:**

.. class:: infomark

Input files with gene coordinates in PTT and RNT format can be retrieved with the Get EDGE-pro Files tool available in Galaxy, or downloaded from the `NCBI ftp repository`_.
This tool accepts files in Sanger FASTQ format (Galaxy *fastqsanger* datatype). Use the FASTQ Groomer tool to prepare your files.

.. _NCBI ftp repository: ftp://ftp.ncbi.nlm.nih.gov/genomes/Bacteria/

.. class:: warningmark

All 3 types of files (FASTA reference genome, PTT and RNT) must have the same order of chromosomes/plasmids (e.g. if chr1 is before chr2 in genome.fasta file, then chr1 must be before chr2 in ptt and rnt files as well). If there is no PTT or RNT file for one of chromosomes/plasmids, place this chromosome/plasmid at the end of the file.

**License and citation**

This Galaxy tool is Copyright © 2012-2013 `CRS4 Srl.`_ and is released under the `MIT license`_.

.. _CRS4 Srl.: http://www.crs4.it/
.. _MIT license: http://opensource.org/licenses/MIT

If you use this tool in Galaxy, please cite |Cuccuru2013|_.

.. |Cuccuru2013| replace:: Cuccuru, G., Orsini, M., Pinna, A., Sbardellati, A., Soranzo, N., Travaglione, A., Uva, P., Zanetti, G., Fotia, G. (2013) Orione, a web-based framework for NGS analysis in microbiology. *Submitted*
.. _Cuccuru2013: http://orione.crs4.it/

This tool uses `EDGE-pro`_, which is licensed separately. Please cite |Magoc2013|_.

.. _EDGE-pro: http://ccb.jhu.edu/software/EDGE-pro/
.. |Magoc2013| replace:: Magoc, T., Wood, D., Salzberg, S. L. (2013) EDGE-pro: Estimated Degree of Gene Expression in Prokaryotic Genomes. *Evol. Bioinform.* 2013:9, 127-136
.. _Magoc2013: http://www.la-press.com/edge-pro-estimated-degree-of-gene-expression-in-prokaryotic-genomes-article-a3586
  </help>
</tool>