annotate iAssembler.xml @ 4:00edccfa662b draft

iAssembler perl wrapper
author rogerngo
date Wed, 16 May 2012 00:24:20 -0400
parents f8037d6c5f14
children
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
2
f8037d6c5f14 Galaxy XML
rogerngo
parents:
diff changeset
1 <tool id="iAssembler" name="iAssembler" version="1.3">
f8037d6c5f14 Galaxy XML
rogerngo
parents:
diff changeset
2 <description>Assembly of transcriptomes.</description>
f8037d6c5f14 Galaxy XML
rogerngo
parents:
diff changeset
3 <requirements>
f8037d6c5f14 Galaxy XML
rogerngo
parents:
diff changeset
4 <requirement type="package">iAssembler</requirement>
f8037d6c5f14 Galaxy XML
rogerngo
parents:
diff changeset
5 </requirements>
f8037d6c5f14 Galaxy XML
rogerngo
parents:
diff changeset
6 <command interpreter="perl">
f8037d6c5f14 Galaxy XML
rogerngo
parents:
diff changeset
7 iAssembler_wrapper.pl -i $input -e $maxlength -h $minoverlap -p $minpercent
f8037d6c5f14 Galaxy XML
rogerngo
parents:
diff changeset
8 </command>
f8037d6c5f14 Galaxy XML
rogerngo
parents:
diff changeset
9 <inputs>
f8037d6c5f14 Galaxy XML
rogerngo
parents:
diff changeset
10 <param name="input" format="fasta" type="data" label="nucleotide fasta file"/>
f8037d6c5f14 Galaxy XML
rogerngo
parents:
diff changeset
11 <param name="maxlength" type="integer" value="30" label="maximum length of end clips (6~100; default = 30)"/>
f8037d6c5f14 Galaxy XML
rogerngo
parents:
diff changeset
12 <param name="minoverlap" type="integer" value="40" label="minimum overlap length (>=30; default = 40)"/>
f8037d6c5f14 Galaxy XML
rogerngo
parents:
diff changeset
13 <param name="minpercent" type="integer" value="97" label="minimum percent identity for sequence clustering and assembly (95~100; default = 97)"/>
f8037d6c5f14 Galaxy XML
rogerngo
parents:
diff changeset
14 </inputs>
f8037d6c5f14 Galaxy XML
rogerngo
parents:
diff changeset
15 <outputs>
f8037d6c5f14 Galaxy XML
rogerngo
parents:
diff changeset
16 <data format="fasta" name="Assembled" from_work_dir="unigene_seq.fasta"/>
f8037d6c5f14 Galaxy XML
rogerngo
parents:
diff changeset
17 </outputs>
f8037d6c5f14 Galaxy XML
rogerngo
parents:
diff changeset
18 <tests>
f8037d6c5f14 Galaxy XML
rogerngo
parents:
diff changeset
19 </tests>
f8037d6c5f14 Galaxy XML
rogerngo
parents:
diff changeset
20 <help>
f8037d6c5f14 Galaxy XML
rogerngo
parents:
diff changeset
21 iAssembler is a standalone package to assemble ESTs generated using Sanger and/or Roche-454 pyrosequencing technologies into contigs. The pipeline gives much higher accuracy in EST assembly than other existing assemblers by employing an iterative assembly strategy and automated error correction of mis-assemblies. iAssembler first performs iterative assemblies using MIRA and CAP3 (default: four cycles of MIRA assemblies followed by one CAP3 assembly) to correct assembly errors (mostly sequences derived from the same transcript that fail to be assembled together), which occur frequently in just one round of assembly. The program then performs post-assembly quality checking by 1) aligning each EST sequence to its corresponding unigene sequence to identify mis-assemblies; and 2) performing all-versus-all pair-wise sequence alignments of unigenes to identify sequences derived from the same transcripts that fail to be assembled together. The identified mis-assemblies are then corrected by the program automatically.
f8037d6c5f14 Galaxy XML
rogerngo
parents:
diff changeset
22
f8037d6c5f14 Galaxy XML
rogerngo
parents:
diff changeset
23 http://bioinfo.bti.cornell.edu/tool/iAssembler/
f8037d6c5f14 Galaxy XML
rogerngo
parents:
diff changeset
24
f8037d6c5f14 Galaxy XML
rogerngo
parents:
diff changeset
25 Citation:
f8037d6c5f14 Galaxy XML
rogerngo
parents:
diff changeset
26 Zheng Y, Zhao L, Gao J, Fei Z. (2011) iAssembler: a package for de novo assembly of Roche-454/Sanger transcriptome sequences. BMC Bioinformatics 12:453
f8037d6c5f14 Galaxy XML
rogerngo
parents:
diff changeset
27 </help>
f8037d6c5f14 Galaxy XML
rogerngo
parents:
diff changeset
28 </tool>