annotate tools/maf/maf_to_fasta.xml @ 2:c2a356708570

Uploaded
author xuebing
date Fri, 09 Mar 2012 19:45:42 -0500
parents 9071e359b9a3
children
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
0
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
1 <tool id="MAF_To_Fasta1" name="MAF to FASTA" version="1.0.1">
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
2 <description>Converts a MAF formatted file to FASTA format</description>
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
3 <command interpreter="python">
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
4 #if $fasta_target_type.fasta_type == "multiple" #maf_to_fasta_multiple_sets.py $input1 $out_file1 $fasta_target_type.species $fasta_target_type.complete_blocks
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
5 #else #maf_to_fasta_concat.py $fasta_target_type.species $input1 $out_file1
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
6 #end if#
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
7 </command>
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
8 <inputs>
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
9 <param format="maf" name="input1" type="data" label="MAF file to convert"/>
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
10 <conditional name="fasta_target_type">
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
11 <param name="fasta_type" type="select" label="Type of FASTA Output">
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
12 <option value="multiple" selected="true">Multiple Blocks</option>
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
13 <option value="concatenated">One Sequence per Species</option>
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
14 </param>
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
15 <when value="multiple">
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
16 <param name="species" type="select" label="Select species" display="checkboxes" multiple="true" help="checked taxa will be included in the output">
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
17 <options>
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
18 <filter type="data_meta" ref="input1" key="species" />
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
19 </options>
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
20 </param>
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
21 <param name="complete_blocks" type="select" label="Choose to">
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
22 <option value="partial_allowed">include blocks with missing species</option>
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
23 <option value="partial_disallowed">exclude blocks with missing species</option>
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
24 </param>
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
25 </when>
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
26 <when value="concatenated">
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
27 <param name="species" type="select" label="Species to extract" display="checkboxes" multiple="true">
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
28 <options>
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
29 <filter type="data_meta" ref="input1" key="species" />
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
30 </options>
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
31 </param>
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
32 </when>
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
33 </conditional>
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
34 </inputs>
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
35 <outputs>
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
36 <data format="fasta" name="out_file1" />
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
37 </outputs>
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
38 <tests>
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
39 <test>
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
40 <param name="input1" value="3.maf" ftype="maf"/>
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
41 <param name="fasta_type" value="concatenated"/>
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
42 <param name="species" value="canFam1"/>
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
43 <output name="out_file1" file="cf_maf2fasta_concat.dat" ftype="fasta"/>
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
44 </test>
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
45 <test>
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
46 <param name="input1" value="4.maf" ftype="maf"/>
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
47 <param name="fasta_type" value="multiple"/>
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
48 <param name="species" value="hg17,panTro1,rheMac2,rn3,mm7,canFam2,bosTau2,dasNov1"/>
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
49 <param name="complete_blocks" value="partial_allowed"/>
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
50 <output name="out_file1" file="cf_maf2fasta_new.dat" ftype="fasta"/>
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
51 </test>
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
52 </tests>
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
53 <help>
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
54
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
55 **Types of MAF to FASTA conversion**
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
56
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
57 * **Multiple Blocks** converts a single MAF block to a single FASTA block. For example, if you have 6 MAF blocks, they will be converted to 6 FASTA blocks.
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
58 * **One Sequence per Species** converts MAF blocks to a single aggregated FASTA block. For example, if you have 6 MAF blocks, they will be converted and concatenated into a single FASTA block.
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
59
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
60 -------
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
61
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
62 **What it does**
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
63
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
64 This tool converts MAF blocks to FASTA format and concatenates them into a single FASTA block or outputs multiple FASTA blocks separated by empty lines.
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
65
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
66 The interface for this tool contains two pages (steps):
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
67
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
68 * **Step 1 of 2**. Choose multiple alignments from history to be converted to FASTA format.
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
69 * **Step 2 of 2**. Choose the type of output as well as the species from the alignment to be included in the output.
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
70
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
71 Multiple Block output has additional options:
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
72
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
73 * **Choose species** - the tool reads the alignment provided during Step 1 and generates a list of species contained within that alignment. Using checkboxes you can specify taxa to be included in the output (all species are selected by default).
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
74 * **Choose to include/exclude blocks with missing species** - if an alignment block does not contain any one of the species you selected within **Choose species** menu and this option is set to **exclude blocks with missing species**, then such a block **will not** be included in the output (see **Example 2** below). For example, if you want to extract human, mouse, and rat from a series of alignments and one of the blocks does not contain mouse sequence, then this block will not be converted to FASTA and will not be returned.
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
75
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
76
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
77 -----
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
78
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
79 **Example 1**:
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
80
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
81 In the concatenated approach, the following alignment::
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
82
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
83 ##maf version=1
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
84 a score=68686.000000
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
85 s hg18.chr20 56827368 75 + 62435964 GACAGGGTGCATCTGGGAGGG---CCTGCCGGGCCTTTA-TTCAACACTAGATACGCCCCATCTCCAATTCTAATGGAC-
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
86 s panTro2.chr20 56528685 75 + 62293572 GACAGGGTGCATCTGAGAGGG---CCTGCCAGGCCTTTA-TTCAACACTAGATACGCCCCATCTCCAATTCTAATGGAC-
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
87 s rheMac2.chr10 89144112 69 - 94855758 GACAGGGTGCATCTGAGAGGG---CCTGCTGGGCCTTTG-TTCAAAACTAGATATGCCCCAACTCCAATTCTA-------
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
88 s mm8.chr2 173910832 61 + 181976762 AGAAGGATCCACCT------------TGCTGGGCCTCTGCTCCAGCAAGACCCACCTCCCAACTCAAATGCCC-------
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
89 s canFam2.chr24 46551822 67 + 50763139 CG------GCGTCTGTAAGGGGCCACCGCCCGGCCTGTG-CTCAAAGCTACAAATGACTCAACTCCCAACCGA------C
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
90
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
91 a score=10289.000000
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
92 s hg18.chr20 56827443 37 + 62435964 ATGTGCAGAAAATGTGATACAGAAACCTGCAGAGCAG
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
93 s panTro2.chr20 56528760 37 + 62293572 ATGTGCAGAAAATGTGATACAGAAACCTGCAGAGCAG
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
94 s rheMac2.chr10 89144181 37 - 94855758 ATGTGCGGAAAATGTGATACAGAAACCTGCAGAGCAG
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
95
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
96 will be converted to (**note** that because mm8 (mouse) and canFam2 (dog) are absent from the second block, they are replaced with gaps after concatenation)::
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
97
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
98 &gt;canFam2
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
99 CG------GCGTCTGTAAGGGGCCACCGCCCGGCCTGTG-CTCAAAGCTACAAATGACTCAACTCCCAACCGA------C-------------------------------------
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
100 &gt;hg18
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
101 GACAGGGTGCATCTGGGAGGG---CCTGCCGGGCCTTTA-TTCAACACTAGATACGCCCCATCTCCAATTCTAATGGAC-ATGTGCAGAAAATGTGATACAGAAACCTGCAGAGCAG
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
102 &gt;mm8
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
103 AGAAGGATCCACCT------------TGCTGGGCCTCTGCTCCAGCAAGACCCACCTCCCAACTCAAATGCCC--------------------------------------------
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
104 &gt;panTro2
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
105 GACAGGGTGCATCTGAGAGGG---CCTGCCAGGCCTTTA-TTCAACACTAGATACGCCCCATCTCCAATTCTAATGGAC-ATGTGCAGAAAATGTGATACAGAAACCTGCAGAGCAG
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
106 &gt;rheMac2
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
107 GACAGGGTGCATCTGAGAGGG---CCTGCTGGGCCTTTG-TTCAAAACTAGATATGCCCCAACTCCAATTCTA-------ATGTGCGGAAAATGTGATACAGAAACCTGCAGAGCAG
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
108
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
109 ------
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
110
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
111 **Example 2a**: Multiple Block Approach **Include all species** and **include blocks with missing species**:
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
112
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
113 The following alignment::
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
114
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
115 ##maf version=1
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
116 a score=68686.000000
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
117 s hg18.chr20 56827368 75 + 62435964 GACAGGGTGCATCTGGGAGGG---CCTGCCGGGCCTTTA-TTCAACACTAGATACGCCCCATCTCCAATTCTAATGGAC-
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
118 s panTro2.chr20 56528685 75 + 62293572 GACAGGGTGCATCTGAGAGGG---CCTGCCAGGCCTTTA-TTCAACACTAGATACGCCCCATCTCCAATTCTAATGGAC-
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
119 s rheMac2.chr10 89144112 69 - 94855758 GACAGGGTGCATCTGAGAGGG---CCTGCTGGGCCTTTG-TTCAAAACTAGATATGCCCCAACTCCAATTCTA-------
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
120 s mm8.chr2 173910832 61 + 181976762 AGAAGGATCCACCT------------TGCTGGGCCTCTGCTCCAGCAAGACCCACCTCCCAACTCAAATGCCC-------
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
121 s canFam2.chr24 46551822 67 + 50763139 CG------GCGTCTGTAAGGGGCCACCGCCCGGCCTGTG-CTCAAAGCTACAAATGACTCAACTCCCAACCGA------C
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
122
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
123 a score=10289.000000
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
124 s hg18.chr20 56827443 37 + 62435964 ATGTGCAGAAAATGTGATACAGAAACCTGCAGAGCAG
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
125 s panTro2.chr20 56528760 37 + 62293572 ATGTGCAGAAAATGTGATACAGAAACCTGCAGAGCAG
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
126 s rheMac2.chr10 89144181 37 - 94855758 ATGTGCGGAAAATGTGATACAGAAACCTGCAGAGCAG
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
127
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
128 will be converted to::
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
129
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
130 &gt;hg18.chr20(+):56827368-56827443|hg18_0
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
131 GACAGGGTGCATCTGGGAGGG---CCTGCCGGGCCTTTA-TTCAACACTAGATACGCCCCATCTCCAATTCTAATGGAC-
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
132 &gt;panTro2.chr20(+):56528685-56528760|panTro2_0
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
133 GACAGGGTGCATCTGAGAGGG---CCTGCCAGGCCTTTA-TTCAACACTAGATACGCCCCATCTCCAATTCTAATGGAC-
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
134 &gt;rheMac2.chr10(-):89144112-89144181|rheMac2_0
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
135 GACAGGGTGCATCTGAGAGGG---CCTGCTGGGCCTTTG-TTCAAAACTAGATATGCCCCAACTCCAATTCTA-------
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
136 &gt;mm8.chr2(+):173910832-173910893|mm8_0
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
137 AGAAGGATCCACCT------------TGCTGGGCCTCTGCTCCAGCAAGACCCACCTCCCAACTCAAATGCCC-------
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
138 &gt;canFam2.chr24(+):46551822-46551889|canFam2_0
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
139 CG------GCGTCTGTAAGGGGCCACCGCCCGGCCTGTG-CTCAAAGCTACAAATGACTCAACTCCCAACCGA------C
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
140
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
141 &gt;hg18.chr20(+):56827443-56827480|hg18_1
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
142 ATGTGCAGAAAATGTGATACAGAAACCTGCAGAGCAG
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
143 &gt;panTro2.chr20(+):56528760-56528797|panTro2_1
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
144 ATGTGCAGAAAATGTGATACAGAAACCTGCAGAGCAG
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
145 &gt;rheMac2.chr10(-):89144181-89144218|rheMac2_1
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
146 ATGTGCGGAAAATGTGATACAGAAACCTGCAGAGCAG
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
147
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
148 -----
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
149
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
150 **Example 2b**: Multiple Block Approach **Include hg18 and mm8** and **exclude blocks with missing species**:
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
151
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
152 The following alignment::
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
153
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
154 ##maf version=1
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
155 a score=68686.000000
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
156 s hg18.chr20 56827368 75 + 62435964 GACAGGGTGCATCTGGGAGGG---CCTGCCGGGCCTTTA-TTCAACACTAGATACGCCCCATCTCCAATTCTAATGGAC-
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
157 s panTro2.chr20 56528685 75 + 62293572 GACAGGGTGCATCTGAGAGGG---CCTGCCAGGCCTTTA-TTCAACACTAGATACGCCCCATCTCCAATTCTAATGGAC-
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
158 s rheMac2.chr10 89144112 69 - 94855758 GACAGGGTGCATCTGAGAGGG---CCTGCTGGGCCTTTG-TTCAAAACTAGATATGCCCCAACTCCAATTCTA-------
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
159 s mm8.chr2 173910832 61 + 181976762 AGAAGGATCCACCT------------TGCTGGGCCTCTGCTCCAGCAAGACCCACCTCCCAACTCAAATGCCC-------
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
160 s canFam2.chr24 46551822 67 + 50763139 CG------GCGTCTGTAAGGGGCCACCGCCCGGCCTGTG-CTCAAAGCTACAAATGACTCAACTCCCAACCGA------C
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
161
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
162 a score=10289.000000
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
163 s hg18.chr20 56827443 37 + 62435964 ATGTGCAGAAAATGTGATACAGAAACCTGCAGAGCAG
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
164 s panTro2.chr20 56528760 37 + 62293572 ATGTGCAGAAAATGTGATACAGAAACCTGCAGAGCAG
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
165 s rheMac2.chr10 89144181 37 - 94855758 ATGTGCGGAAAATGTGATACAGAAACCTGCAGAGCAG
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
166
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
167 will be converted to (**note** that the second MAF block, which does not have mm8, is not included in the output)::
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
168
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
169 &gt;hg18.chr20(+):56827368-56827443|hg18_0
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
170 GACAGGGTGCATCTGGGAGGGCCTGCCGGGCCTTTA-TTCAACACTAGATACGCCCCATCTCCAATTCTAATGGAC
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
171 &gt;mm8.chr2(+):173910832-173910893|mm8_0
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
172 AGAAGGATCCACCT---------TGCTGGGCCTCTGCTCCAGCAAGACCCACCTCCCAACTCAAATGCCC------
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
173
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
174 ------
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
175
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
176 .. class:: infomark
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
177
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
178 **About formats**
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
179
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
180 **MAF format** multiple alignment format file. This format stores multiple alignments at the DNA level between entire genomes.
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
181
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
182 - The .maf format is line-oriented. Each multiple alignment ends with a blank line.
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
183 - Each sequence in an alignment is on a single line.
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
184 - Lines starting with # are considered to be comments.
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
185 - Each multiple alignment is in a separate paragraph that begins with an "a" line and contains an "s" line for each sequence in the multiple alignment.
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
186 - Some MAF files may contain two optional line types:
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
187
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
188 - An "i" line containing information about what is in the aligned species DNA before and after the immediately preceding "s" line;
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
189 - An "e" line containing information about the size of the gap between the alignments that span the current block.
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
190
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
191 ------
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
192
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
193 **Citation**
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
194
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
195 If you use this tool, please cite `Blankenberg D, Taylor J, Nekrutenko A; The Galaxy Team. Making whole genome multiple alignments usable for biologists. Bioinformatics. 2011 Sep 1;27(17):2426-2428. &lt;http://www.ncbi.nlm.nih.gov/pubmed/21775304&gt;`_
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
196
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
197
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
198 </help>
9071e359b9a3 Uploaded
xuebing
parents:
diff changeset
199 </tool>