Mercurial > repos > iuc > bedtools
comparison getfastaBed.xml @ 1:82aac94b06c3 draft
Uploaded
author | iuc |
---|---|
date | Thu, 08 Jan 2015 14:25:51 -0500 |
parents | b8348686a0b9 |
children | 607c0576c6ab |
comparison
equal
deleted
inserted
replaced
0:b8348686a0b9 | 1:82aac94b06c3 |
---|---|
4 <import>macros.xml</import> | 4 <import>macros.xml</import> |
5 </macros> | 5 </macros> |
6 <expand macro="requirements" /> | 6 <expand macro="requirements" /> |
7 <expand macro="stdio" /> | 7 <expand macro="stdio" /> |
8 <command> | 8 <command> |
9 <![CDATA[ | |
9 bedtools getfasta | 10 bedtools getfasta |
10 $name | 11 $name |
11 $tab | 12 $tab |
12 $strand | 13 $strand |
13 $split | 14 $split |
14 -fi $fasta | 15 -fi $fasta |
15 -bed $inputA | 16 -bed $input |
16 -fo $output | 17 -fo $output |
18 ]]> | |
17 </command> | 19 </command> |
18 <inputs> | 20 <inputs> |
19 <param format="bed,vcf,gff,gff3" name="inputA" type="data" label="BED/VCF/GFF file" /> | 21 <param format="bed,vcf,gff,gff3" name="input" type="data" label="BED/VCF/GFF file" /> |
20 <param format="fasta" name="fasta" type="data" label="Fasta file" /> | 22 <param format="fasta" name="fasta" type="data" label="Fasta file" /> |
21 <param name="name" type="boolean" checked="false" truevalue="-name" falsevalue="" label="Use the “name” column in the BED file for the FASTA headers in the output FASTA file" /> | 23 <param name="name" type="boolean" checked="false" truevalue="-name" falsevalue="" |
22 <param name="tab" type="boolean" checked="false" truevalue="-tab" falsevalue="" label="Report extract sequences in a tab-delimited format instead of in FASTA format" /> | 24 label="Use the 'name' column in the BED file for the FASTA headers in the output FASTA file" |
23 <param name="strand" type="boolean" checked="false" truevalue="-s" falsevalue="" label="Force strandedness" help="If the feature occupies the antisense strand, the sequence will be reverse complemented." /> | 25 help="(-name)" /> |
24 <param name="split" type="boolean" checked="false" truevalue="-split" falsevalue="" label="Given BED12 input, extract and concatenate the sequences from the BED 'blocks' (e.g., exons)" /> | 26 <param name="tab" type="boolean" checked="false" truevalue="-tab" falsevalue="" |
27 label="Report extract sequences in a tab-delimited format instead of in FASTA format" | |
28 help="(-tab)" /> | |
29 <param name="strand" type="boolean" checked="false" truevalue="-s" falsevalue="" | |
30 label="Force strandedness" | |
31 help="If the feature occupies the antisense strand, the sequence will be reverse complemented. (-s)" /> | |
32 <expand macro="split" /> | |
25 </inputs> | 33 </inputs> |
26 <outputs> | 34 <outputs> |
27 <data format="fasta" name="output" /> | 35 <data format="fasta" name="output"> |
36 <change_format> | |
37 <when input="tab" value="-tab" format="tabular" /> | |
38 </change_format> | |
39 </data> | |
28 </outputs> | 40 </outputs> |
41 <tests> | |
42 <test> | |
43 <param name="input" value="nucBed1.bed" ftype="bed" /> | |
44 <param name="fasta" value="nucBed1.fasta" ftype="fasta" /> | |
45 <param name="tab" value="False" /> | |
46 <param name="split" value="False" /> | |
47 <output name="output" file="getfastaBed_result1.bed" ftype="fasta" /> | |
48 </test> | |
49 <test> | |
50 <param name="input" value="nucBed1.bed" ftype="bed" /> | |
51 <param name="fasta" value="nucBed1.fasta" ftype="fasta" /> | |
52 <param name="tab" value="True" /> | |
53 <param name="split" value="False" /> | |
54 <output name="output" file="getfastaBed_result2.tabular" ftype="tabular" /> | |
55 </test> | |
56 </tests> | |
29 <help> | 57 <help> |
58 <![CDATA[ | |
30 **What it does** | 59 **What it does** |
31 | 60 |
32 bedtools getfasta will extract the sequence defined by the coordinates in a BED interval and create a new FASTA entry in the output file for each extracted sequence. By default, the FASTA header for each extracted sequence will be formatted as follows: “<chrom>:<start>-<end>”. | 61 bedtools getfasta will extract the sequence defined by the coordinates in a BED interval and create a new FASTA entry in the output file for each extracted sequence. By default, the FASTA header for each extracted sequence will be formatted as follows: “>chrom>:<start>-<end>”. |
33 | 62 |
34 .. image:: $PATH_TO_IMAGES/getfasta-glyph.png | 63 .. image:: $PATH_TO_IMAGES/getfasta-glyph.png |
35 | 64 |
36 .. class:: warningmark | 65 .. class:: warningmark |
37 | 66 |
38 1. The headers in the input FASTA file must exactly match the chromosome column in the BED file. | 67 1. The headers in the input FASTA file must exactly match the chromosome column in the BED file. |
39 | 68 |
40 2. You can use the UNIX fold command to set the line width of the FASTA output. For example, fold -w 60 will make each line of the FASTA file have at most 60 nucleotides for easy viewing. | 69 2. You can use the UNIX fold command to set the line width of the FASTA output. For example, fold -w 60 will make each line of the FASTA file have at most 60 nucleotides for easy viewing. |
41 | 70 |
42 @REFERENCES@ | 71 @REFERENCES@ |
72 ]]> | |
43 </help> | 73 </help> |
44 <expand macro="citations" /> | 74 <expand macro="citations" /> |
45 </tool> | 75 </tool> |