# HG changeset patch # User xuebing # Date 1331921697 14400 # Node ID 6bd2945ec360ef4485b13d49963ef7885bfbdb86 # Parent aa8bed8ca1e38688da6a80cdf38641fb3fc5fb4d Uploaded diff -r aa8bed8ca1e3 -r 6bd2945ec360 match.xml --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/match.xml Fri Mar 16 14:14:57 2012 -0400 @@ -0,0 +1,54 @@ + + find short motif occurrences + ./match $motif $seq $output $nmismatch $rc $bed > $log + + + + + + + + + + + + + + +**What it does** + +This tool searches for occurrences of short nucleotide sequences (allowing mismatches) in a set of longer sequences. + +Example motif file:: + + >motif1 + CAGGTAAGT + >motif2 + GTTTGGGGGCC + +Example sequence file:: + + >hg18_chr6_122208322_122209078_+ + CGTCGTAGCTACTAGCTACGTACGTACGTAGCTAGCATGCATGCTACGTA + CGTAGCTAGCTAAAAAAAAAAAAAAACTGCGGCTAGCTAGCTAGCTACGT + CGATCGTAGCTAC... + >hg18_chr6_1208322_122209023_+ + CGATGCTAGCTAGCTAGCTACGTAGCTAGCTAGTCGATGCTAGCTAGCTA + ATGCTAGCTAGC.... + +Output (bed):: + + chr11 72790893 72790902 ACTTAACTG 1 - antisense 5ss,G4T:CAGTTAAGT-rc hg18_chr11_72790846_72791902_+ 47 + chr11 72791880 72791889 CAGGTAAGA 1 + sense 5ss,T9A:CAGGTAAGA hg18_chr11_72790846_72791902_+ 1034 + + +Output (tab):: + + Tmod4 802 5ss:CAGGTAAGT-rc ACTTACCTG + Atp7b 77 5ss:CAGGTAAGT CAGGTAAGT + Fnta 665 5ss:CAGGTAAGT CAGGTAAGT + + + + +