Mercurial > repos > rnateam > graphclust_fasta_to_gspan
diff fasta2shrep_gspan.xml @ 0:b6e6830ff06b draft
planemo upload for repository https://github.com/eteriSokhoyan/galaxytools/tree/branchForIterations/tools/GraphClust/GSPAN commit 21aaee40723b5341b4236edeb0e72995c2054053
author | rnateam |
---|---|
date | Fri, 16 Dec 2016 07:35:04 -0500 |
parents | |
children | 358c52752305 |
line wrap: on
line diff
--- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/fasta2shrep_gspan.xml Fri Dec 16 07:35:04 2016 -0500 @@ -0,0 +1,98 @@ +<tool id="gspan" name="fasta_to_gspan" version="0.1"> + <requirements> + <requirement type="package" version="0.1">graphclust-wrappers</requirement> + <requirement type="package" version="2.1.6">rnashapes</requirement> + </requirements> + <stdio> + <exit_code range="1:" /> + </stdio> + <command> + <![CDATA[ + + 'fasta2shrep_gspan.pl' --fasta '$dataFasta' $i_crop_unpaired_ends $i_abstr $i_stacks -t "3=0,5=80" -M $M -c $rel_energy_range -win $wins -shift $shift $u $seq_graph_t --group $group + +]]> + </command> + <inputs> + <param type="data" name="dataFasta" format="fasta" /> + <param name="i_stacks" truevalue="-stack" falsevalue="" checked="True" type="boolean" label="Add stacking information to graphs." help="-stack"/> + <param name="i_abstr" truevalue="-abstr" falsevalue="" type="boolean" label="Add abstract structure graphs to the single shrep graph instances." help="-abstr"/> + <param name="i_crop_unpaired_ends" truevalue="-cue" falsevalue="" type="boolean" label="Add abstract structure graphs to the single shrep graph instances." help="-cue"/> + <param name="M" type="integer" value="5" size="7" label="Max number of shreps that should be taken per window." help="-M"/> + <param name="rel_energy_range" type="integer" value="20" size="7" label=" Relative energy range, i.e. percentage (%) of MFE energy (RNAshapes)" help="-c"/> + <param name="wins" type="text" value="40,150" size="20" label=" A list of window sizes to use" help="comma separated integers"/> + <param name="shift" type="integer" value="30" size="7" label="The shift of the window, relative to the window size given inpercent." help="by default 30"/> + <param name="u" truevalue="-u" falsevalue="" checked="True" type="boolean" label="Ignore unstable structures (RNAshapes)" help="-u"/> + <param name="seq_graph_t" truevalue="--seq-graph-t" falsevalue="" checked="True" type="boolean" label="Add for each 't #' a graph which contains no structure" help="--seq-graph-t"/> + <param name="group" type="integer" value="10000" size="7" label="Group size." help="by default 10000"/> + </inputs> + <outputs> + <data name="gspan.zip" format="searchgui_archive" from_work_dir="GSPAN_Outputs/1.group.gspan.bz2" label="gspan zip" /> + </outputs> + <tests> + <test> + <param name="dataFasta" value="data.fasta"/> + <output name="gspan.zip" file="GSPAN_Outputs/1.group.gspan.bz2" /> + </test> + </tests> + <help> + <![CDATA[ + +**What it does** + +For each fragment of input sequence we use RNAshapes to create a set of structures. +The default parameters for example consider for each input fragment again a +window of size 40nt and 150nt with a window shift of 30%. This allows to +consider local structures as well as global structures for a fragment. +From each such RNAshape window we take the top 5 shreps (suboptimal +structures for the top 5 shapes) within 20% of the mfe energy of that window +and convert them into graphs. +As shape level (abstraction level) we use 3 for short sequences and 5 for +sequences >= 80nt. Please see also RNAshapes documentation for all these +terms. + + +**Parameters** + ++ **input** : Sequences in Fasta format. + ++ **stack** : This adds an additional vertex (type P) for each pair of stacked base-pairs and four edges + (type p) from each of the involved bases to the new vertex. + ++ **abstr** : Add abstract structure graphs to the single shrep graph instances. + ++ **cue** : Crop unpaired ends. If you give this flag, then the unpaired ends of each single structure are ignored. E.g. the structure + ...(((...))).. becomes just (((...))) + ++ **M** : Max number of shreps that should be taken per window. + ++ **c** : Relative energy range, i.e. percentage (%) of MFE energy (RNAshapes) Use only one of -e and -c! + ++ **wins** : A list of window sizes to use. If none are given (empty string ''), then the entire sequence is taken with no windows. Each window > 1 required! + ++ **shift** : The shift of the window, relative to the window size given in percent. So you give which percent of the window size shall be + used for the shift. Of course the shift is rounded down to the + nearest whole number. + Example 20 % of a window 150 would result in a step size of 30 nt. + It is a relative parameter, as you can give different window sizes. + If you do not give this parameter there is a default shift of 1 nt. + ++ **u** : Ignore unstable structures (RNAshapes). This option filters out closed structures with positive free energy. + ++ **seq-graph-t** : Add for each 't #' a graph which contains no structure + ++ **group** : Combine/group that number of input seqs into 1 gspan file output name is then '<INT>.group.gspan.bz2' + + ]]> + </help> + <citations> + <citation type="doi">10.1093/bioinformatics/bts224</citation> + <citation type="bibtex">@article{jan:gie:2015, +author={Janssen, Stefan and Giegerich, Robert}, +title={The RNA shapes studio}, +journal={Bioinformatics}, +year={2015}, +doi={10.1093/bioinformatics/btu649}, +url={http://bioinformatics.oxfordjournals.org/content/31/3/423.abstract}}</citation> + </citations> +</tool>