# HG changeset patch # User iuc # Date 1752528788 0 # Node ID 7653ebd919bbdb9c7b710bdb947d9e400db154bd planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/meme commit 89ee0af6e955ff964b7984d77ad536e0a9154278 diff -r 000000000000 -r 7653ebd919bb all_fasta.loc.sample --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/all_fasta.loc.sample Mon Jul 14 21:33:08 2025 +0000 @@ -0,0 +1,18 @@ +#This file lists the locations and dbkeys of all the fasta files +#under the "genome" directory (a directory that contains a directory +#for each build). The script extract_fasta.py will generate the file +#all_fasta.loc. This file has the format (white space characters are +#TAB characters): +# +# +# +#So, all_fasta.loc could look something like this: +# +#apiMel3 apiMel3 Honeybee (Apis mellifera): apiMel3 /path/to/genome/apiMel3/apiMel3.fa +#hg19canon hg19 Human (Homo sapiens): hg19 Canonical /path/to/genome/hg19/hg19canon.fa +#hg19full hg19 Human (Homo sapiens): hg19 Full /path/to/genome/hg19/hg19full.fa +# +#Your all_fasta.loc file should contain an entry for each individual +#fasta file. So there will be multiple fasta files for each build, +#such as with hg19 above. 
+# diff -r 000000000000 -r 7653ebd919bb macros.xml --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/macros.xml Mon Jul 14 21:33:08 2025 +0000 @@ -0,0 +1,18 @@ + + 0 + 5.5.8 + 23.0 + + + meme + + + + &2 echo "this tool is only available for non commercial use"; + exit 1; + #end if + ]]> + + diff -r 000000000000 -r 7653ebd919bb streme.xml --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/streme.xml Mon Jul 14 21:33:08 2025 +0000 @@ -0,0 +1,162 @@ + + Simple, Thorough, Rapid, Enriched Motif Elicitation + + macros.xml + + + streme + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + value is not None and value > 0 + + + + + + + + + + + + value == True + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + 10.1093/bioinformatics/btr261 + + \ No newline at end of file diff -r 000000000000 -r 7653ebd919bb test-data/alphabet.txt --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/alphabet.txt Mon Jul 14 21:33:08 2025 +0000 @@ -0,0 +1,13 @@ +ALPHABET "DNA with covalent modifications" DNA-LIKE + +# Core uppercase symbols +A "Adenine" 8510A8 ~ T "Thymine" A89610 +C "Cytosine" A50026 ~ G "Guanine" 313695 + +# Covalent modifications +m "5-Methylcytosine" D73027 ~ 1 "Guanine:5-Methylcytosine" 4575B4 +h "5-Hydroxymethylcytosine" F46D43 ~ 2 "Guanine:5-Hydroxymethylcytosine" 74ADD1 +f "5-Formylcytosine" FDAE61 ~ 3 "Guanine:5-Formylcytosine" ABD9E9 +c "5-Carboxylcytosine" FEE090 ~ 4 "Guanine:5-Carboxylcytosine" E0F3F8 +a "N6-methyladenine" 8510A8 ~ t "Thymine_lowercase" 756BB1 +g "modified_g" 00897B ~ 5 "cytosine_lowercase" 53698A diff -r 000000000000 -r 7653ebd919bb test-data/dreme_fimo_input_1.xml --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/dreme_fimo_input_1.xml Mon Jul 14 21:33:08 2025 +0000 @@ -0,0 +1,99 @@ + + + dreme -oc dreme_out -norc -p input.fa + + + + + + + + + + + + + + + + + + + + given + + + 100 + 0.01 + 1 + ThinkPad-T450s + Wed May 02 16:45:34 CEST 2018 + + + 
+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + diff -r 000000000000 -r 7653ebd919bb test-data/dreme_test_sites.fa --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/dreme_test_sites.fa Mon Jul 14 21:33:08 2025 +0000 @@ -0,0 +1,2000 @@ +>U2AF2_K562_rep02_1 +UCUACACAUAGGGUGUUCCUGAAAAGCCCCAUAGUGAUUGAGUCUUCAAAACCACCGAUUC +>U2AF2_K562_rep02_2 +UUGGAUAGCGGAAGCCCUGACCAGGCAUGGAGUAUCUCACAAAGUAGACGAUUCCUCUGGG +>U2AF2_K562_rep02_3 +GGUUUCGGUCUAAGUACCACCCAGAUGAGGUGGGGAAGCGUCGGCAGGAGGCCCGGGGGGC +>U2AF2_K562_rep02_4 +AAACAGGGUUUGUGGAUGCACUUAGAUGUUUGCAAUGAGCACUGUGGCUGGCAUGCCCCAG +>U2AF2_K562_rep02_5 +UCCCAUUGUUUCUGCAGAGGCAGUUGGUGUCACCAGCCAGCGACCAGUGUUUUGUCCUUUU +>U2AF2_K562_rep02_6 +UUCUACCCUCUCUAACUCCUCCCAGCAGCAAAAGGGAGACACUUCAGCUGGAACAAAAUAG +>U2AF2_K562_rep02_7 +UUCUACCCUCUCUAACUCCUCCCAGCAGCAAAAGGGAGACACUUCAGCUGGAACAAAAUAG +>U2AF2_K562_rep02_8 +UUUUCUCCCUUCCACCCACACCCUGCAGCGUCGAGGUCCUCAGCGAUCAGUUGAUGUAAUA +>U2AF2_K562_rep02_9 +GGCAGGGGAAGUGGGGAUGGCAGGACAUGGAUGGCCCUUGAGGCAUUGGCUCUGGGUGUCA +>U2AF2_K562_rep02_10 +GCAGGGGAAGUGGGGAUGGCAGGACAUGGAUGGCCCUUGAGGCAUUGGCUCUGGGUGUCAU +>U2AF2_K562_rep02_11 +UUAGUCUUUCCAUCUACAGCCCACUGGCACUCCAGGCACCUACCUACUUCAAACAAGCUCA +>U2AF2_K562_rep02_12 +UUUCUCUUUUCCUUCCACAGGGGACCGUGAUUAGGGUAUUUUCCAUUCCAGAAGGACAAAA +>U2AF2_K562_rep02_13 +AUAACUGUUUUGUCUUUCCCUCCCCCGCUUCGUUCCCAGGUUUCGGUCUAAGUACCACCCA +>U2AF2_K562_rep02_14 +UUUCAGAGAACGUUUGUCUGCCUGAUGAGAGCCACUUGGGUUAAGAAACUACCUGUGAAUA +>U2AF2_K562_rep02_15 +AUGCUUUGCAAUUGCAGCUCCUUUAUGUCUCCAAAUGAUACAAGAAGACCCGAGAAAGUGG +>U2AF2_K562_rep02_16 +UUUGCAAUUUUGCCUAGGGCCCUGGUGGUGGCAACCGCCUGUGUGCCACUGAAAAUCGUGC +>U2AF2_K562_rep02_17 +UUGCAAUUUUGCCUAGGGCCCUGGUGGUGGCAACCGCCUGUGUGCCACUGAAAAUCGUGCC +>U2AF2_K562_rep02_18 +CUAAUUUUUAAAAAGCAGCCUCUGGAGCCAGCCAUGUUUGGCACUGAAUCUUCAUGUAAGU +>U2AF2_K562_rep02_19 +UCUAAUUUUUAAAAAGCAGCCUCUGGAGCCAGCCAUGUUUGGCACUGAAUCUUCAUGUAAG +>U2AF2_K562_rep02_20 
+UUUCUGUCUUCUCCUCUCUUCCUUUACACAAACUUAAACAGAAUGGAAAUGAAAACCAAGG +>U2AF2_K562_rep02_21 +AAACAGUUUCAGCUCCUGGCAUCAGCUCUAUUCAAAUCUGGUUCAGAUUUUACAGCUCUGG +>U2AF2_K562_rep02_22 +UUCUCUCUCUUCCCCUGGCUCCCUCAAGGUGAACAGCCAUAUACCAGGAAUAGGAUACCAG +>U2AF2_K562_rep02_23 +UAUAUCCUUAGUGCAGGCUGUGGAAGAACAGGUGCCAUUUGUGCCAUAGAUUAUACGUGGA +>U2AF2_K562_rep02_24 +UCCCUAAUUCUUCACCUCCCCCUCCUCUGCUGCCUCCUUGCUCUCCUCGCAGGUCAAGUUU +>U2AF2_K562_rep02_25 +AUUGUUACUCCCAGGUGCCUUCGAAACAUCUGCAAGUUUUUAGUCUUGCUCAUCCCACUCU +>U2AF2_K562_rep02_26 +CACAUUUUUUAAAAGGGCAAGUACAGGAGCAACUGCUGCUACCCAGAAAAAUGUGUGUAUU +>U2AF2_K562_rep02_27 +CACAUUUUUUAAAAGGGCAAGUACAGGAGCAACUGCUGCUACCCAGAAAAAUGUGUGUAUU +>U2AF2_K562_rep02_28 +AUUCCGUAGGUUCUAAUCUGUUCUCCCUCCUCCUCAACGUAAGUACACAGUGGAUACCCUC +>U2AF2_K562_rep02_29 +UAUUCCGUAGGUUCUAAUCUGUUCUCCCUCCUCCUCAACGUAAGUACACAGUGGAUACCCU +>U2AF2_K562_rep02_30 +ACUAAAGUUUUUUUUCCUAGUGGUUAUCAUGAGACUUAUAUAAAACAUGUUGUAUCUUAAC +>U2AF2_K562_rep02_31 +CCUCCUCUUUCUCCCUCCCUCCUUCAUUCCCUCCAUCCCUCUCUUAACAGCUUGAAGAUAA +>U2AF2_K562_rep02_32 +CCUCCUCUUUCUCCCUCCCUCCUUCAUUCCCUCCAUCCCUCUCUUAACAGCUUGAAGAUAA +>U2AF2_K562_rep02_35 +AUUUAUCCUCUUGCUUUUGCAUCUCAAAAUUUUAUCGCCUUGAAGACACGUUUCUAUGAAU +>U2AF2_K562_rep02_36 +GUCAGAAGGUAGCAGGGGCUGGGGGUUGCAGGGGGAUGUUGAGAAGAAGUGGUCCUUUGGU +>U2AF2_K562_rep02_37 +AGUCAGAAGGUAGCAGGGGCUGGGGGUUGCAGGGGGAUGUUGAGAAGAAGUGGUCCUUUGG +>U2AF2_K562_rep02_38 +UUGCUUCUCCUUUCUUCCUUCCUUCCUGCCCAGGGCCUCAUCUUUGUGGUGGACAGUAAUG +>U2AF2_K562_rep02_39 +UAGAGACUGUUUAUUUGUUUGGUGGCUGGGAUGGAACACAAGAUCUUGCUGACUUCUGGGC +>U2AF2_K562_rep02_40 +CUUAGGUAUGCCGAGCAGACAGCUGGAGGAUCCCGGGGCAGGGACACCUAGCCCGGUGCGU +>U2AF2_K562_rep02_41 +AUUCUCCUGGGUUUUUGGCAGAUGGUUGCAGUGGCAGGACCAAGGCCUAGUGAGCUAUAGC +>U2AF2_K562_rep02_42 +GCAGAUGGUUGCAGUGGCAGGACCAAGGCCUAGUGAGCUAUAGCUAAAUCUACAGUGGGAU +>U2AF2_K562_rep02_43 +CCCCGUGCCUUGCCUCCCCAGGCGUGUGACCCCCUGCCGCACGAGGAGGAGCCCUCUGAAG +>U2AF2_K562_rep02_44 +UUUACCCCACUACUAGGUAAGGGGCCUGGAUACCAAGAAGUGACUGCUCAUCUAAUCCAUA +>U2AF2_K562_rep02_45 
+GAUGGUCAUUGUCCUCCAGAGCAGUGAUGGAGGAAAUACCAGCCCAGGAAGCAGCAGGGUC +>U2AF2_K562_rep02_46 +AUGGUCAUUGUCCUCCAGAGCAGUGAUGGAGGAAAUACCAGCCCAGGAAGCAGCAGGGUCA +>U2AF2_K562_rep02_47 +UAGGCCUGUGAGGCUGCCACACCCUGUGCCCCCGUGCCUUGCCUCCCCAGGCGUGUGACCC +>U2AF2_K562_rep02_48 +CAGGUCUCUCCUUACGGGGCCAGGGCAAUUUCUUUUCGUUCUUGCCCGUGUUGAACUGGGC +>U2AF2_K562_rep02_49 +UACUUCUCUUUCCCUGUCCCCAAAGCAGAUCGCCAAACUGAGGCAGCAACUACAACGCAGU +>U2AF2_K562_rep02_50 +GGCGUGUGACCCCCUGCCGCACGAGGAGGAGCCCUCUGAAGUGCCACAGCUGCGCCAGCCC +>U2AF2_K562_rep02_51 +GUGGGCAGUGGGCGAGCCAGGCUGGGGGUUGUGGGGGAGGCCUGGGUUGCAGGUUUAAGCG +>U2AF2_K562_rep02_52 +AAGUUCCACUCUUGUCCUGGGGACCCAGCUUUAACUUUAGCAUCUGGUAUGUUGAACUUAG +>U2AF2_K562_rep02_53 +UCACUCCUUCUCUUUCCUAAGACUGACUUUAUGGCCUUUCACCAAGAACAUGAAGUGCGUA +>U2AF2_K562_rep02_54 +GAGCGCAGCAAGACAGAUUAGGGGAAGGGGAGAGGAGAGACUUGGCUAGCAAAGGUCUUGU +>U2AF2_K562_rep02_55 +GGAGCGCAGCAAGACAGAUUAGGGGAAGGGGAGAGGAGAGACUUGGCUAGCAAAGGUCUUG +>U2AF2_K562_rep02_56 +CUUUCUCUUUCUCUCUUUCUCUCUCUUUCUGUCUGUCUGUCUGUCUUUCUGUCUUUCUUUC +>U2AF2_K562_rep02_57 +UGUUCUGCUUUCCUCCUUAGGCCAGGUGCUGUGUGUGCUGCCGUCUGUCUGUAUUUUCUUC +>U2AF2_K562_rep02_58 +GUGACCAGUUCUUUUGCAGGAAAUUGUUUCUGAGAAGACUGGAAGACAAGAAAUAUCCCAC +>U2AF2_K562_rep02_59 +UCUAUAUUACAGGAGAUACAACUCGUCAACGAAUCAAAUUCAGUGAUGACAGAGUAUGCAA +>U2AF2_K562_rep02_60 +UCUAUAUUACAGGAGAUACAACUCGUCAACGAAUCAAAUUCAGUGAUGACAGAGUAUGCAA +>U2AF2_K562_rep02_62 +GUAACAGAGUAAGCAGGAAAUUCACAGGAGGUCUGCUCGGCUCAGAAACACUAAAUACAAA +>U2AF2_K562_rep02_63 +GUCCUUUUCUCUGAGGAUGUGCUGCCUAGUGUCGUGGAAUCUGCCUGACCAUUGCAAGCAU +>U2AF2_K562_rep02_64 +UUCCCCAUUCCAGAUCCUGGGUGUUUGGCUGACCUACAGAUACAGGAACCAGAAAGACCCC +>U2AF2_K562_rep02_65 +AUUAACAUAAUGAACCAUAUUCAUUUCUUGGUCAGUUGUGAGCCAUUCUUUUAUUCCACUU +>U2AF2_K562_rep02_66 +AUUAACAUAAUGAACCAUAUUCAUUUCUUGGUCAGUUGUGAGCCAUUCUUUUAUUCCACUU +>U2AF2_K562_rep02_67 +CUUUUUCUUUCCUGUAUCCUUUUUAGGUUUCUAGCCAUCCAUGAGAAGGAAGUUAAUGAAA +>U2AF2_K562_rep02_68 +UUCUUUACAGGGAACACUGAAAGGUUUUGACCAGACCAUUAAUUUGAUUUUGGAUGAAAGC +>U2AF2_K562_rep02_69 
+CCUCUUUUACCUAAUAGGUGGCCAGCAUCGAAAUGUUCAGCCUUUUAGUGAUGAAGAUGCA +>U2AF2_K562_rep02_70 +UUGCUUUUCACAGGCGUGGGAUCCAGGAUGGUGUCCUCUGUGAGGACUUGAACUCUGGGGC +>U2AF2_K562_rep02_71 +UUAUUCUCUCUUUCUGCAGAUGGGCUUUCUCCACAUGAUGGAGAAGAUGGCUGCCAGGUAC +>U2AF2_K562_rep02_73 +CAUUCCAUCAUCAAAGGUAUUGAUAACAGAACAUGGCGACUUGGGAAAUGGAAAGUUUUUG +>U2AF2_K562_rep02_74 +UCUCUAAAUUUUUCCCCCUACUUUCUUGCUUCUGUUUCACAUUUUUUAAAAGGGCAAGUAC +>U2AF2_K562_rep02_75 +UCUCUAAAUUUUUCCCCCUACUUUCUUGCUUCUGUUUCACAUUUUUUAAAAGGGCAAGUAC +>U2AF2_K562_rep02_76 +UUUUCAGAUUACUGAGAGUCUUCAGUUACUAGGUAAGUCGCCCCAUCCUUAUUACUCCAGG +>U2AF2_K562_rep02_77 +UUUCAGAUUACUGAGAGUCUUCAGUUACUAGGUAAGUCGCCCCAUCCUUAUUACUCCAGGU +>U2AF2_K562_rep02_80 +GCACGUGCUUUGCCCUGGGUACAGCCAGAGCCCUUCAACCCCACCUUGGACUUGAGGACCU +>U2AF2_K562_rep02_81 +AGAGGACGAAAACGAAGCUUCGUUCCUGAGGAAGAAAAACAUGAGGUUGGAAUAAGUUAAG +>U2AF2_K562_rep02_82 +UUUUUUUCCAGAGAACCAGAGGACGAAAACGAAGCUUCGUUCCUGAGGAAGAAAAACAUGA +>U2AF2_K562_rep02_86 +GGUCUAUGGUACCGUUGCUUCAGGUGAUAUCCAGGGGUUCUCCUAUGUCUUUUGAAGAUUC +>U2AF2_K562_rep02_87 +UUCUUCUCCCCUUUUUGCCCAGUUAAUCCAUAUUCAUCUGCAGAUAUGUUACCCAUGUUAC +>U2AF2_K562_rep02_88 +UUUUUGUUUUUUCCACAGAUUCCUAGAUAGGGUUGUUCAUCUGUCAUCUUAAAAGGGUUUU +>U2AF2_K562_rep02_89 +UUCUCUCUCUCUCUACAGAAUGGUCCUAGUGCCAGAUCGUGUCAUAAAAUGUGCAUUGAUA +>U2AF2_K562_rep02_90 +UUUUUGUUUUUUUUUUUGUUUUUUUCCAGAGAACCAGAGGACGAAAACGAAGCUUCGUUCC +>U2AF2_K562_rep02_92 +UUUUUUUUCUUCUGUCCUUUUGUGUGUGUCCUUCCCUCUCAUCGUUGGCCACUCAUAGAUA +>U2AF2_K562_rep02_93 +UCUUGUGUAGGUUUUUCCGUCGUGGCUGGGUGACCUUCGACCGCAGUGUUAACAUUAAAGA +>U2AF2_K562_rep02_94 +CAGUUUCUACAGACUGCCAUUGCUAUGCACGGCUGAGAUGGACAGAGUUUGCUUGUGAAUC +>U2AF2_K562_rep02_95 +AAUUUAUUUCAAAGGAUGCGAAGUACAAAACUGCUUCGGCUCAUUGACUUAGAUUUUUCAU +>U2AF2_K562_rep02_100 +UUUUCAUUUCCUUCAGAGGGCAGAGGUGGCUCAGAGAGAGGCGGAGACCUUAAGGGAACAG +>U2AF2_K562_rep02_103 +CUACAGUGUUCUCAUUCCUCAGAGCAGCCAGGAUGUGUUAUUUCAGGAGUUUGUGACAUUC +>U2AF2_K562_rep02_104 +CUACAGUGUUCUCAUUCCUCAGAGCAGCCAGGAUGUGUUAUUUCAGGAGUUUGUGACAUUC +>U2AF2_K562_rep02_105 
+UAGCGAUAGGGUCUCACCAUGUUGCCCAGGCUGGUCUUGAACUCCUGGACUCAUCCUAAAG +>U2AF2_K562_rep02_106 +AGCGAUAGGGUCUCACCAUGUUGCCCAGGCUGGUCUUGAACUCCUGGACUCAUCCUAAAGU +>U2AF2_K562_rep02_109 +CUUGUUUCUUCCUAAGUAUAAGGUCUCUGAGAAGGUCUGUAGAGUGUGGCUUAGAUUCCAG +>U2AF2_K562_rep02_110 +UUGUUUCUUCCUAAGUAUAAGGUCUCUGAGAAGGUCUGUAGAGUGUGGCUUAGAUUCCAGG +>U2AF2_K562_rep02_111 +AAGUGGUCCUUUGGUCAGGGUGGGAAGCCAACAGGAUUUCCUGGUGCAUUGGAGGUGAAAG +>U2AF2_K562_rep02_112 +GAAGUGGUCCUUUGGUCAGGGUGGGAAGCCAACAGGAUUUCCUGGUGCAUUGGAGGUGAAA +>U2AF2_K562_rep02_116 +GACAGCCAGGUACCAGGUGAGCUGAGGAACCCUCUGCUUUUCCUCAGGGACUAUUGCUACU +>U2AF2_K562_rep02_117 +ACAGCCAGGUACCAGGUGAGCUGAGGAACCCUCUGCUUUUCCUCAGGGACUAUUGCUACUG +>U2AF2_K562_rep02_118 +UCAUUCCCUGCUCUAUCCCCAGGCCCAGGGCACUGCCUGAUGCAUGGUAGCACUUAUAAAU +>U2AF2_K562_rep02_119 +CUUUUUAGCUCCUUGUUUAGUCAUUCACUAAUUUCCAUACAUGAUAACGAAUUCUUCGGUG +>U2AF2_K562_rep02_121 +UUUUCUCUAUUCCAGUGGCCCUUUCUCUGCAGCUGGGCCCCACACCUACAUCCAUCCGUUU +>U2AF2_K562_rep02_122 +GCUAUGACUUCACACCUAUGGAUUCUUCUGCAGUUUAUGUGUUAAGUAGUAUGGCUCGCCA +>U2AF2_K562_rep02_123 +UUUUUGUUUUGGUGGCAGGGGAUAGGGUCUCCCUCUGUCUCCCAGGCUGGAGUGCAAUGGU +>U2AF2_K562_rep02_126 +AGGGGCAGGACAGAGCCCUUUCCUAGGGAAGCCCGGCACCCCCUGCUGUCCAGGGAAGGGG +>U2AF2_K562_rep02_127 +GAAGACCGAGGCGGUUUCAGGGGAUUGUCCCCUCCAGGGUCUGCUACACUGUCUGAAGGAG +>U2AF2_K562_rep02_128 +GGAUACCCUCUCUAUGAUCUUCAUUCUCUGGCCAUGGUGCUACAGUGUUCUCAUUCCUCAG +>U2AF2_K562_rep02_129 +GGAUACCCUCUCUAUGAUCUUCAUUCUCUGGCCAUGGUGCUACAGUGUUCUCAUUCCUCAG +>U2AF2_K562_rep02_130 +AGUGGGAGUGCGGAGGGGCUCCCGAGGGGGCUCCUGGGCCUGGUUUGAGAGAGGCCAAGAA +>U2AF2_K562_rep02_131 +AGUGGGAGUGCGGAGGGGCUCCCGAGGGGGCUCCUGGGCCUGGUUUGAGAGAGGCCAAGAA +>U2AF2_K562_rep02_132 +UUGUGUUAUUGCUUCCAGGUCAGGGGUCACCACAUUGCAAAACUUGAUCCUCUCGGAAUUA +>U2AF2_K562_rep02_133 +GUUUUCUGGUAUUUUCUAGCAUCCUUCUCACCACAGCCAUAACCCUUUUUUACUUCCAUUA +>U2AF2_K562_rep02_134 +UCUCUUUUUGCUCACCUGGGGAGUUCCUUCCCCUUUCCAUAAACUGUGGUCCCUGCAUGGC +>U2AF2_K562_rep02_138 +CACCAAUCACACUUUCGCAGUGGAGAAAGUGCUGUGACUUUCCUCGCCAGGCGCCUCCCUC +>U2AF2_K562_rep02_139 
+GUUUAUCAGCCAUAGGUUGGAGGCAACAGCUGGAAAUGGCUCUUCCCCUUCAAGGUUGUAG +>U2AF2_K562_rep02_140 +UCCACUUGCAUUCAUUCUCCACUGGCCCUCCGUAUCCACAGAUUCCCGCAACCAACUGUAU +>U2AF2_K562_rep02_147 +UGUCAUUUUUUCCUUUUCCAGGCAUCCUUGUUCAUCUAGCAAUAUCUGAACUGCAGUGCAU +>U2AF2_K562_rep02_149 +CUGUUAUAGUGUGACUGUUGCUUUUUUGUCUCCUUUUCUUUUAAACAGGGUUUGUGGAUGC +>U2AF2_K562_rep02_150 +UUUUUUCUAGAGAUGGUUUCUACCCCGACUGUUUCCCAGGCUGGUCUGAACUCCUGGUCUC +>U2AF2_K562_rep02_151 +UUUUUCUAGAGAUGGUUUCUACCCCGACUGUUUCCCAGGCUGGUCUGAACUCCUGGUCUCA +>U2AF2_K562_rep02_158 +UUGAUUUUGGUUCAUCUCUUUUUAGGUCUGAUGCCUGGAGGGAGGGUCAAGCUGGUACAUA +>U2AF2_K562_rep02_159 +UUCUUUUUGUCUACCCAUCUCCCUUCAGUCUUAAUAAAAGGUCUUAAACAGUUACAUGAGA +>U2AF2_K562_rep02_165 +ACCAUUUUUUUCAGGUGAUUGAAGCAGAGCAUAUAUGAUCUCCACAUAUCAAGACUAACGG +>U2AF2_K562_rep02_166 +CAAUUUCUGUGACUGUCAACCCUCUUGUGUCCUCCUAACCUCCUUCCUCAGCUUGCAUGGA +>U2AF2_K562_rep02_169 +CCAUCACCUCUCAACCUUUGCUUCGACAGGUCUUCACUCACGAUUUAUUCCUCCAGGUCUU +>U2AF2_K562_rep02_170 +AGGCUGGGAGGCAGGGCUGAGAGGUGGCCGAGAGAGAGGAGUCGCAGAGCCGCCAGAGUGA +>U2AF2_K562_rep02_171 +ACCUUUUUUUCUUCCCAGCCUCAGGUAUGAAUCAGCAGCAUGAAAAUGGAUUUGAAUACAG +>U2AF2_K562_rep02_179 +CAUGUUCCAGCCUUGCCUUUAGGAAGGGAGGACGUUCCGACCAGCCCGUUGUUCAGGGUGG +>U2AF2_K562_rep02_180 +UGCUCAUCCCACUCUUCCUUUUACUAGGUAAGUCAAAUCUGGCUGAGUUGCCUCCGAUGGC +>U2AF2_K562_rep02_181 +CUGUUGGCCAGUUUGCUGGGGGAAGCGGGCCAGGAACCAGCCCUGGCAGAAGUGUUCCACC +>U2AF2_K562_rep02_182 +CUGUUGGCCAGUUUGCUGGGGGAAGCGGGCCAGGAACCAGCCCUGGCAGAAGUGUUCCACC +>U2AF2_K562_rep02_183 +CUUUUUCUUUUAUAUGGGGGGCCGCAAAGGCGUCGACAUUCCAGAUGGCUAUCCUGCUUCA +>U2AF2_K562_rep02_184 +UCCCUCUUUCCCGACAGCAGCUGCGGCAAGAGAGCCCUGCCCUCUCCGAGGCCUGCUCAGC +>U2AF2_K562_rep02_185 +CUUCCUGUUUCUCUCCCAUAGGAGAGGGCUGAACCCCCCUCAUCGUGUCAAGUCAAUCUCC +>U2AF2_K562_rep02_186 +GACUAUUGCUACUGAUGGAGUGUGGCCUCUCUCUCAUCCCAUCUGUAGACCUUGCCUGGAA +>U2AF2_K562_rep02_187 +GACUAUUGCUACUGAUGGAGUGUGGCCUCUCUCUCAUCCCAUCUGUAGACCUUGCCUGGAA +>U2AF2_K562_rep02_190 +CUUUUUCCCCCAUCCAACAGGCUGUGUGGUUCCGGUGCUGGUGCCGUGGAAGUGGCAAUGG +>U2AF2_K562_rep02_191 
+AUCUUCUUCACCAGGCUUUUCUGAUGUGGAUCACACCUAUGCUCAAAGAACUCAGCUCUUU +>U2AF2_K562_rep02_193 +GUUCACUUGGUUUCUAGGUCUAUUCUGGAUAAGCAGGUUUUGUGAAGACAUUUAUUCUUUC +>U2AF2_K562_rep02_194 +GAUAAUAUUAUAUUUCUGAGUGACCAGACGAAAGAGAAGGAGUAGAAAGGAUGAUUCUUCU +>U2AF2_K562_rep02_196 +AUUAUUUCAUUAUCGUUUCUCUGCAACCUUUCUUCAAUGGUACUAAGCAAGACACAUCUGG +>U2AF2_K562_rep02_197 +AAGGCAUGACCUUCCUUUCUCCUUGGCAUAGGCCUUACAACACUGAGGAAAGGCCAUGGUU +>U2AF2_K562_rep02_198 +ACUUCACCAUUCCUUUCAGAAAAAAGGAGAAGAAAAGAACCUACUGAAAACAUUUCUGGUU +>U2AF2_K562_rep02_199 +UUCUCCAGCUGGUUCUUUUCAUUUUACUGCAGAGAUAUUGCCGGAUCAUGACAUAAAAGAU +>U2AF2_K562_rep02_200 +UUUUUUUUUUUUUCCCCUCGUAGGCUAUUAUUCGUGAAUUGGGUGGUAUUCCAAUUGUUGC +>U2AF2_K562_rep02_202 +CCCCCUACAGGCUUUUGUCUUAUUAAGUGAUCUACUUCUCAUCUUUAGCCCUCAGAUGAUU +>U2AF2_K562_rep02_203 +CUUUCCUUCCUUCUUUCCUCUUUUUUUCUUUCCUCCCUCCCUCCCUUUCUUUCUUCCUUCC +>U2AF2_K562_rep02_204 +CUUCUUCCUAGCUGAUAUUCAGCAAUGAGUAUACCCAGGCAGAAAACCAGAAUUGGCACCU +>U2AF2_K562_rep02_205 +CCUUCUUGUCUUCCACAGGUCUAUAGUGAGCGAGAGCUGCUACUUUUUACUUGGGCAUUCA +>U2AF2_K562_rep02_206 +UCUUUCAGCUCUGUGUUCUCGUUUUGCCCAAGACCUUUGGCUAGAGCAGAACAUAAAAGAU +>U2AF2_K562_rep02_207 +UCUCUUGUAACUCCUCAGGCAUUUCUCACAAGAGUGGCAAAGAUACAGCAGGGUGCAUUAG +>U2AF2_K562_rep02_208 +UUCUUUCAUGACCUUUUUUCUUAUUUAGAGAUCCUCCAUAGAUAAUGAAAACCUGGUUUCA +>U2AF2_K562_rep02_210 +UGUGCACACCUCACGGCAAGGGCCAGCCUGUUUCCUCCCGGUCACCUCCAAAUCUUGCUGC +>U2AF2_K562_rep02_211 +UGUGCACACCUCACGGCAAGGGCCAGCCUGUUUCCUCCCGGUCACCUCCAAAUCUUGCUGC +>U2AF2_K562_rep02_212 +UUUUUUUAAGCGUUUGGCAACAUAUUGACUGCAUGGGGAUUGAUAGGCAGCAUAUUCCUGA +>U2AF2_K562_rep02_213 +UUCCUAGGACUAGUAGAUGCUGCAGUCGAUGCAGCACCAGGAGCAGGUGUGUGUAUACCAU +>U2AF2_K562_rep02_214 +UUAUGUAUUGUUUCCCUCUUUGUUUAGCUUGAACAUGCGAAAGUGACACAGACAGAGUUGA +>U2AF2_K562_rep02_220 +UUUAUUUAUUUUCAGAGGGCGCCUCACUCUGUUGCCCAGGCUGGAGUGCAGUGGUGCAAUC +>U2AF2_K562_rep02_221 +AACCUUUGCUUCCACAGACUUUUUCAUCCCUAAGAUACUAGAAGAAGAGCAUACAUAAACG +>U2AF2_K562_rep02_222 +CUUCUUUUCUAGCUACUCUCGGAACCGCACGUUUGACACGUACAUUGGGCAGGGCUACGUG +>U2AF2_K562_rep02_223 
+CUUGGGCUUCUUCUUCACAGGGUCUCAUAAGCCAUGGCACAAGACAAGAUUUGAGAGUGGC +>U2AF2_K562_rep02_231 +CUGCUACUCUUAAUCUUCUCUAAAUUUUUCCCCCUACUUUCUUGCUUCUGUUUCACAUUUU +>U2AF2_K562_rep02_232 +GCUGCUACUCUUAAUCUUCUCUAAAUUUUUCCCCCUACUUUCUUGCUUCUGUUUCACAUUU +>U2AF2_K562_rep02_233 +UAUUAUUUCUUAGGACCAGAAGUCCUUGAUGAGGAAGGAACUCAAGAAGACCUAGAGUACA +>U2AF2_K562_rep02_234 +UCCUGCUGACACCCCUUGGGCUGGAGAGGCCUCCUCUGAAAGGGAGCCCUGGGAAAGGGCU +>U2AF2_K562_rep02_235 +GUCCUGCUGACACCCCUUGGGCUGGAGAGGCCUCCUCUGAAAGGGAGCCCUGGGAAAGGGC +>U2AF2_K562_rep02_240 +UUUACUUCCAUUAGGCCGUAUAACUGGAGAGACCUGCUGCUCGUUAUAUAAUUAUCUGAUA +>U2AF2_K562_rep02_241 +UCCUCCCAAGCAGAAAAUAUCCUAGGGGCAAGCCUGUGUAUGAUGUGCCUGUUUCUGUUAU +>U2AF2_K562_rep02_246 +AACUUUUUUGUUUCUUCCUUCUCUAUCCCUUUACUUUAGCUUUUAAGUGAAUUUUGAUUUU +>U2AF2_K562_rep02_247 +UGCUUUAUUUUGGUAGUUGGCGCAGAUCAAGACUCCAUCUGAAAAAAACAAGUGUAUAUAU +>U2AF2_K562_rep02_251 +CUUUUCCCCCAUCCAACAGGCUGUGUGGUUCCAGGUGCUGGUGCCGUGGAAGUGGCAAUGG +>U2AF2_K562_rep02_256 +UAAGUUUCCCUGCCGCAGAGUGAAGCAGAUACGUGUGUGUUGGGGCAUUCGGGGCAUGGAG +>U2AF2_K562_rep02_257 +GAAUUUGGCUUUUUUGCAGGUCCCUAGCUGUUGGUAGUAAGUCCGGUUAUAAAUUUUUCUC +>U2AF2_K562_rep02_258 +CUUUUUCGUUCCAGAGCGCCGCCCUGUGCUGGGCUGCCGGGAGCUCGUCUUCAGGAACCUC +>U2AF2_K562_rep02_269 +AACCCUACAGCCUACCCGUUCCAUCCCGGGCUAUCCCAGUUCCCCACUGCCAGGGAACCCC +>U2AF2_K562_rep02_270 +CUUCCAGAUGAGAUAUCACAGAGGCUUGGGCCUAGAUUGUCAUCAGCAUACUGCUAUACUA +>U2AF2_K562_rep02_271 +UUCACUCCUUGUCACAGUGAGCACAGUAGUGCCACAGGGUCCUGGCGAGGACCUAUGAAGC +>U2AF2_K562_rep02_272 +CUAUUAUUUUACCUAUCCCUUUGUUCCUUUCCUAUUCUCUGUACUUGUAGUCUGACGUGUG +>U2AF2_K562_rep02_282 +UUGUCCCCUUCUCCACCACGUAGGAUCUGAAGAAGCUGAAGAAAAACAGGACAGUGAGAAA +>U2AF2_K562_rep02_285 +CCGUUUAUCUGUAGGAUAUUGGGAGUGUGUGGCAUGCAUCCUCAUCAUCAGGAAACUCUAA +>U2AF2_K562_rep02_286 +ACCCUUUGUCCCCACUUGCUGCCGGGAUGAGAGGUAAGCACGGACCCGCCCACCCUCUGAC +>U2AF2_K562_rep02_293 +GUUUCUCUUCCCUUCCCCCCUUCCCCUGCGGUUGUAGAGCCCGUUCUGUCCGGUCGUGGUU +>U2AF2_K562_rep02_294 +CCUGUUUUUUCUAUUCCUCUUCCUUUUCAAUGGCUUAGGUAUUGCAGUUUCUUAUUUCACA +>U2AF2_K562_rep02_295 
+UUAUAAAUUUUUCUCCCUUUCUUCUGUGGAUAAGCUGGAACAGAUCUAUGAAUGCAGUAAG +>U2AF2_K562_rep02_296 +UCUUCUUCCAUUUUUAUUUCCUUCCCCAUUCAGCACCACAUGAAUCAGAAUUUUUUUGAAA +>U2AF2_K562_rep02_297 +CUGUUUCCCUAUUAUUUCCUUACUCUGCUGAACAUGUCCGCUGUUUUACCUCACUGCUCCU +>U2AF2_K562_rep02_298 +CUGUUUCCCUAUUAUUUCCUUACUCUGCUGAACAUGUCCGCUGUUUUACCUCACUGCUCCU +>U2AF2_K562_rep02_299 +UCUUCUUAUUCAGGCAACAUAAGCUUUACAACAAGGAGUUGUAUGCUGACUUCAUUGCUGC +>U2AF2_K562_rep02_300 +UCCAGACCGCUCCUGAGUGGGAGGAGGGGUUCCUGUAGCCGUUGCGUCUUCUCAAACACGG +>U2AF2_K562_rep02_301 +UACAGAGCCAUAAGUGUGAUCCUUGGUGACAGGUGGAAGAAAAUGAAGAAUGAAGAGAGAA +>U2AF2_K562_rep02_302 +UUCUUUUUCUCCUCCCCUGGCAGCAACAGCCAGGCCUGUAGCAGUGCCCUUCGGAAACCAG +>U2AF2_K562_rep02_303 +UUUUCUCACUUUUCCAGUGGUCGUAGCAGGAACAGCGUCUUGACCUCACAUCAGUGACGUG +>U2AF2_K562_rep02_304 +UGGGGAUGUCUGGAAAGGUUGUUGCCGAGGGGGCUGGGCGCAGCCACCCUGUCCCGAGCAG +>U2AF2_K562_rep02_319 +UCACUCUUUUCCCUGACCCUUGGGGCCCAGGGCCAUGGAGGGACCCUUAGGAGUUCAAUGA +>U2AF2_K562_rep02_320 +UCACUCUUUUCCCUGACCCUUGGGGCCCAGGGCCAUGGAGGGACCCUUAGGAGUUCA +>U2AF2_K562_rep02_321 +UCACUCUUUUCCCUGACCCUUGGGGCCCAGGGCCAUGGAGGGACCCUUAGGAGUUCAAUGA +>U2AF2_K562_rep02_322 +AAUGCUCAAAUUGGUUUGGGGGAGCUAUAGGAAACAGUCUCUGAAGAUGCAUAAGGGGCAG +>U2AF2_K562_rep02_323 +UCAUUGUUGAACUCCCACUUUAGCAGAUCACAGAAGAGGAGGUCAGAAAUCUGAAGCACAA +>U2AF2_K562_rep02_324 +ACUCUAAGUUUACUUCUGUUCUCCCUACACUUCCCCACGUAUAUUAUUCGAGUUAAUUUUU +>U2AF2_K562_rep02_325 +UCCUUUACUCUCAUUUCAACUUCCUCCAUAGUAUUGCUGUAAUUAAUCAAAGUAGGCAAAG +>U2AF2_K562_rep02_326 +UUUUCAGUCUUUCCCAUAAAGGUAAUGAAUUUUGGGGCACUACACAAACACUGAAUGUUAA +>U2AF2_K562_rep02_327 +CAAUAGCAGACUCCAGUUUGGGAAUUGAUCCUCUUCGGAGACCUGGACUUCACAUAAACCA +>U2AF2_K562_rep02_328 +UCAAUAGCAGACUCCAGUUUGGGAAUUGAUCCUCUUCGGAGACCUGGACUUCACAUAAACC +>U2AF2_K562_rep02_329 +UUCCUUCUAUCUUUCCCCGUCUUUUCUUCCUUCCUGUAUUGACUUGUUUUGACACAUUUGU +>U2AF2_K562_rep02_345 +CUGCUUCCUUCCCUGACAGGCGGCUGUGGUGCUUCAGGCAGCUUUCAGGGGACAUCUCACG +>U2AF2_K562_rep02_346 +AUAUAUUUUCCCUCCCUUUCUUCCUCCCCUCCCCUCCCUCGCUUCCUUCCUUCCUUCCUUU +>U2AF2_K562_rep02_347 
+AUAUAUUUUCCCUCCCUUUCUUCCUCCCCUCCCCUCCCUCGCUUCCUUCCUUCCUUCCUUU +>U2AF2_K562_rep02_348 +CCUUUCUCUUUUUAGCCCCUGGAGGAACGCGCAUAGAUGAUGGUGACAAGACCAAGAUGAC +>U2AF2_K562_rep02_349 +UUAAUUUGUAGUUCCAAUGACAGGAUUUACACAGAGAGCAACUAUUGAUCCAGAACUGAAU +>U2AF2_K562_rep02_350 +UCCUUUCCUCCUCCUUUCUCCCCAUCUCCCUCCACCGCCUUUUUUUGAUUGACCAAGGAUC +>U2AF2_K562_rep02_351 +CUGUUUUAGGAUAUUAGAAAUGGCUACUCCCCAGUCAAUUUUCAUCUUUGCAAUCUGCAUU +>U2AF2_K562_rep02_352 +AAUUUGCUUCUUUCUCCCAUCAGCAUUACCUUGUGGUUUUCUUCUGCAUUUGAGACACAGU +>U2AF2_K562_rep02_365 +CUCAGAAGAGGGUUGGUAGGCCUGGGGGAUGGAUGGGGUUGCUGAAGGCCAUGGCUGAAGC +>U2AF2_K562_rep02_366 +UUUUUUUUCCUUGUCACUAGGUUCCACUAGCACAGUCAGUUUACUUUAGGUUUAUGUCUAA +>U2AF2_K562_rep02_367 +GUGUGGCGGGCAGGGCGGCUCCUGGAGGUGGGAUCUGGGUCAGAGUUACUUCAUGCAUGUC +>U2AF2_K562_rep02_368 +UUCCCAAAUGCUGGAAAAUCCUCUUUGCUAAGUUGUGUUUCUCAUGCAAAACCUGCAAUUG +>U2AF2_K562_rep02_369 +UAGUUAAUAUCUUUGUCCAUACAUCUUUCCAUGCAUCUAUGAUUGUUUCUUUAGGAAUAGA +>U2AF2_K562_rep02_370 +GGGUAACUUUUUUGCCUGUCUCCCAUCCUCCUUUACUCUCAUUUCAACUUCCUCCAUAGUA +>U2AF2_K562_rep02_371 +UUUUCUUGAUAGGACCUUGCUAAGCAGUACUCUGACAGACUAGAAUGCUGUGAAAAUGAAG +>U2AF2_K562_rep02_372 +UUUUAGCUGGAAAGUGAAAUUUCAACCACAGCAGAUGACUGCAGUUCAGAGGUAAGACUAA +>U2AF2_K562_rep02_373 +CUUCAUGUUUUGAGUUGGUUUCUAUUUUCCCUUCAUUUCAGUUAAAUCCUUAAAUAUAAUU +>U2AF2_K562_rep02_374 +UUCAUGUUUUGAGUUGGUUUCUAUUUUCCCUUCAUUUCAGUUAAAUCCUUAAAUAUAAUUU +>U2AF2_K562_rep02_375 +CUCUCCCGCUUGCCUCUGGCAGGAGCUGGGCUGGUGAUGAAGGUCAAGCAGGAGAAGCCGG +>U2AF2_K562_rep02_376 +UUUGUCUGACUUCUUUCACUUUCAGCUUACGAGGAAAUAUUUCAGUAAAAGCAGUUAAAAA +>U2AF2_K562_rep02_377 +CAACACUCUUAUAUACCAAAGUGACCUGAAGGACGGAUGCUGUGUCUUGUUUAUCUGCAUA +>U2AF2_K562_rep02_378 +GUGUCCUUUGCCUGCAGAGACCUGUCUGGGCCGCAGAGAGGAGUCUGGAGGUAGGGUCCAA +>U2AF2_K562_rep02_379 +GUGUCCUUUGCCUGCAGAGACCUGUCUGGGCCGCAGAGAGGAGUCUGGAGGUAGGGUCCAA +>U2AF2_K562_rep02_380 +CUCGUUUUCUUUUUUAGGCCUGAUCAACCCCGUAUAACCAAAGAUGUAAUUUGUUUUCAUG +>U2AF2_K562_rep02_399 +CUUCAUUGAUAGCUAACUUCUCCUUUGCCACUUACUGAACGGUCUGAUCUCUGGAGAAUUC +>U2AF2_K562_rep02_400 
+UACAGUACGGGGUGGACGUGAGGAGCCGGGACGCCCGGGGCCUGACUCCACUGGCAUAUGC +>U2AF2_K562_rep02_401 +AUUUCUCUGAAUUUCUAGAUAUACACCUGAAGAAAUUGAGAAGCUCAAGGAGUAAGUUUUA +>U2AF2_K562_rep02_402 +UUCUCUCUCCUCUCUCUCGUCCUCUACCCCUGCCCCCUGGGUGUUUUUGCAGUUGGUUAGU +>U2AF2_K562_rep02_403 +UUAUUAUCCCUUGUAUGGCAGGAAAGAGUUCCUAGAGAGAGAAGACAAAGACAGUCUGUGU +>U2AF2_K562_rep02_404 +UUAGGUAAUUUCAUCUGUGCCAAAGCCUCCAGAGGACAAGCCAGAAGAUGUACAUACAAGU +>U2AF2_K562_rep02_429 +AUAUCCUUCAUUCUUUAGGCACUGUGAGCCCUGAGAUGUUCAAGAAGAUGUCCAACUCAGA +>U2AF2_K562_rep02_430 +UGUGCAUGUGUGGGUGUGUGUGGGCACAGGUGUGAGUGUGUGAGCAACAGUACCCCAUUCC +>U2AF2_K562_rep02_431 +UGUGCAUGUGUGGGUGUGUGUGGGCACAGGUGUGAGUGUGUGAGCAACAGUACCCCAUUCC +>U2AF2_K562_rep02_432 +CUUUCCCCAGCCUGACAUUUACCCCGGUAACUGCUGGGCAUUUAAAGGCUCCCAGGGGUAC +>U2AF2_K562_rep02_433 +CGUGGGAAGGGAGGCUGGGAGACAGAGGGGACAGUGGCUUCCUGGGUCUGUGAAGACUGAU +>U2AF2_K562_rep02_434 +UUCUGUCUUCCGUUUUCAGCUAAAUUCUGUCCAACGUUUAAUAAAUCAAUGGAGGAACAGG +>U2AF2_K562_rep02_435 +UUAGCUUUGCUCUACAGGUGUUGGAUGACAAGGGCUCGAGCCUCAGCGCCUGUCCUGAUUC +>U2AF2_K562_rep02_436 +ACCUUCCUUCUACCUUUGGGCUUCUGCAUUAGGCUGCUCUUGAAGUGUUUGCCGGGGCCUU +>U2AF2_K562_rep02_437 +UCUCUCCCGCAGCCCACAGAGCAGUUCAACGGGCAGGGCGCCAGCUUCAACGGGGGCAGCG +>U2AF2_K562_rep02_438 +AUUCCUUUUGCUUGUUUCACAGGGGGUUUGAAGAGGACAAAUAAGUUUUUGUUGGUUAAUU +>U2AF2_K562_rep02_439 +UAUUUUUUCCCAGUGCCGACCUCACUUUCCCCACUUGUCCGACCUGCUGCCCAGGCGUCGA +>U2AF2_K562_rep02_440 +CUUCCUGCCCUGGCUCCAUCCUCAGGGGCUCCCUGCAGACAGGGGGGGCCUUCGCCCUGGA +>U2AF2_K562_rep02_441 +UGCCACCCUUUUUUCCUUAGGGUCAAGAAGACUGACUGACAGACCAGGACCCCACCAGGGG +>U2AF2_K562_rep02_442 +UUUCUUUCUAAUCAUUUUUCACCCUUUCUUUAUUUCUUUAAUUGAGUAAUUCCAAGUAAGA +>U2AF2_K562_rep02_443 +CCCUUUUUAUCUCUAGUAACACUUGUCUCUCGCCUCAAAGUCUUCUUAGCUACACCUGCUU +>U2AF2_K562_rep02_444 +CUCCUUUUCUUUUUUAAAAGCUUGGCUACACUGUAACUAACUAGGGUUAAGAGUACCAGUA +>U2AF2_K562_rep02_445 +CUUUGCCCUGUCCGGUUCUGGCAGGUGUGUGGACCCAGGCACUGGGAAGACUCAGCGAGCC +>U2AF2_K562_rep02_2538 +UUUUUCCUUCUUUUCCCACCCCCUCCCCCUCCAUGUGAAGAUUUGGGUGCUUAACAUAUCA +>U2AF2_K562_rep02_2539 
+GAUCUGGUUUUCUUCUGGGGCAUUUAUCCGUGCUGAUCUUGGUGAAUGGGGCAUGAGUCUA +>U2AF2_K562_rep02_2540 +ACUAUUUUAGGAAUCUGGAAAACCAGGGGCUCAUGUAACUGUGAAGAAGCUGUUUGUUGGC +>U2AF2_K562_rep02_2542 +AUUUUUCAUUUCGUAGGAGGGAGCAAAGGAGUUUGCUGCUGCUCUCACCGCUGAGCGGAUA +>U2AF2_K562_rep02_2543 +UUUCCCCCCAGAAAACUUUAGAAACUGUUCCUUUGGAGAGGAAAAAGGUACUCUGCCAGCA +>U2AF2_K562_rep02_2544 +GUAUUUUCCUUUGCAGAGAGAAAAGGAACAGUUCCGUAAGCUCUUUAUUGGUGGCUUAAGC +>U2AF2_K562_rep02_2546 +CCCAACCUUUUCUUCUUUCCCAACUUCCCCUUCCUUUCAUAACGUUUUAAGAAAAGUAUAU +>U2AF2_K562_rep02_2547 +GUCUUAUCCACCUUUAGGAUUGGAGAGGGAGAAAGAAAAACUGCUUUGUGUGCCAAAAGCA +>U2AF2_K562_rep02_2548 +UUGCAGCUUUUCAUGCAACACCCAACACUUAUAAGCGGAAGAACACAGAAACAGCUCUAGA +>U2AF2_K562_rep02_2549 +UACAACUGAACUUUUUUUCUUUUUAGUUACUCCACAGGAUCCGCUGAACAUAGGAUGUUGC +>U2AF2_K562_rep02_2550 +UUUUUUUCCUUUGGCAGGAAGGUGUCUUGCUGCAGGUAACUAAUGAAGAAGUGGUCAACCA +>U2AF2_K562_rep02_2551 +UUUGUGUUUUUGCAGGUUGUGGGCUGCACACUGCAGAAAGAUACAGCUGAAAAAGGGUUAG +>U2AF2_K562_rep02_2552 +GUGUUUUUUUCUGUUUGGAUGACUUUUACCCCACCACUAUUUUAGGAAUCUGGAAAACCAG +>U2AF2_K562_rep02_2553 +AUUAUGCAUUUUCUCCCCAGGUCAGCUGGCUGCCUCAUUGCCACCUCCACCUGCAGGAAGG +>U2AF2_K562_rep02_2554 +UCCUGCAGGCAUCUCUAGGUACAACAAAAUACUGCAGUUACUUCUUAAAGAAUAUGCAGUG +>U2AF2_K562_rep02_2555 +UCCCCCUCAGCUUUGUGUCCCUCCUCUAAGGAAAUGGCCCCCGCCAUCGACUGGUUGUCCU +>U2AF2_K562_rep02_2556 +AACAGUUUAUAGUAAACGUAAUCUUUUUUUGGCCCCUAACAGAUGGAUAUGGCAGUGGACG +>U2AF2_K562_rep02_2557 +UUUCCCCUCUUUGAACCAAGCCACUCCUACCUAGGAACUAAAUGGGUAUAUAUUGCCUGUU +>U2AF2_K562_rep02_2558 +UUUGUCUUUCCUCCCUGGGGACCGCUGCCACCCGUGCGGGCCGAAGCCUCGCGAAGCCGUC +>U2AF2_K562_rep02_2559 +UCCUAAUUGCCUCCUUUAUAGCAAAAGAACAUCUUCAUCCUAAAUCUUCUCUCCCAGCAUG +>U2AF2_K562_rep02_2560 +CUUUUUCCUUUACUCCUGGCAGGCUAAUAUUUUUUUAAAGAUUAUACUUCAUAUCUGUGAG +>U2AF2_K562_rep02_2561 +UUUCCAUAUUUCUAGUUCCACAGGAAAGCGAGUGACCUCGCACCUAUAUCCAUAGCAACCA +>U2AF2_K562_rep02_2562 +UACUCCACAGGAUCCGCUGAACAUAGGAUGUUGCCACAAAAUCUACCUCGUGUAUUUUUCU +>U2AF2_K562_rep02_2563 +UUUUUUUUUUUUUUUUUGUUCUUCUCCUUUAGGUGGUAAAUAAAGAUGUCCUGGACGUUUA 
+>U2AF2_K562_rep02_2564 +CUUCUUUUCCUUUACCCCUCUUCCUCCUGCAGGCAUCUCUAGGUACAACAAAAUACUGCAG +>U2AF2_K562_rep02_2565 +CUCCCUGCUUCUCUCCAGUCUCUCUUGUGCCCAGAUAGACCAGCCAGAGUUUGAUGUUCCC +>U2AF2_K562_rep02_2566 +UUUUUGAGAUAGGGUCUCCCUCUGUCGAACAGGCUGGAAAGUGUAGUGUGUGAUCAUCUUG +>U2AF2_K562_rep02_2568 +AAUCUAGCAUCAUAGCUCCAGCUCCCGCUGAGGAUGUGGAUACUCCUCCAAGGAAAAAGAA +>U2AF2_K562_rep02_2569 +AAGCUUAUAGCUUCAUUGCACCAUGUGUGGCAUUUGGGCGCUGUUUGGCAGUGAUGAUUGC +>U2AF2_K562_rep02_2570 +UUGGAGAGGAAAAAGGUACUCUGCCAGCAGGUCACCUCAUAUUUAAGAAUUUAAUUUCCUG +>U2AF2_K562_rep02_2571 +AUUCACUCUUGAUUCCGCAGGCUGGACAGGAAGCACGGCAGCAUCUACUCGGCUUCUGAGG +>U2AF2_K562_rep02_2572 +UCUUUGUGCCAUUUUCUUUUUUCGAUCUUUCUCAGGUAGGGAAUAAUGAAAUUUGGAUCAU +>U2AF2_K562_rep02_2573 +CAUGCCCACUCUAGGGUUCUGAUCCCACUGCAUUCUCCGUCCUUACCCAAGCCAUCACUGG +>U2AF2_K562_rep02_2575 +UCUCUCAGUUCUUCCAUUACCUUCCCCAGAGGCAAGAAGUUACCAAUUUCUUGGACUUUCA +>U2AF2_K562_rep02_2576 +CCAGCUCGCAGCUUUGCGUGGGCACCCCUUUCCCUGCAGGUGCACCUGGGAACUGGAGACC +>U2AF2_K562_rep02_2577 +UUUCCCUUCCCCAGGCUUUUUCUCCUCCGUGACAGCCAGAGUAAUCCAAAGGCAUUUGUAC +>U2AF2_K562_rep02_2578 +ACCUAAAUUAAAGCUGCCACUGCAGAGCCCCGCCAUGGAAGACACGCCGUUGGUGAUAUCG +>U2AF2_K562_rep02_2580 +UUCUCUUCUUUUUCUCACACCCAAGGGGAAGCCCUUUCCCCUUCCUUCUCUUUUCCUUUUC +>U2AF2_K562_rep02_2584 +AUUUCUUUUCUAGGUCCUACGGGAAGUGAAGGUGCUGGCAGGUCUUCAGCACCCCAAUAUU +>U2AF2_K562_rep02_2585 +UUUUUUUCCCUGCCGGAAUUUUAGCAUUGAUAUGAACCAUGGACAAGUAUAUUCUGCUGCC +>U2AF2_K562_rep02_2586 +GUUCAUCUGUCCCUUUCCAGGGGGAAGACUGUUGCUCUCAAAGAAGUAGGUUUUUGGCUGG +>U2AF2_K562_rep02_2587 +UUCUAGUUGGAGCUCAGCUGCAUGGAAGGCAGCUGCACGUGUUCGUUCCCAACCAGUGAGC +>U2AF2_K562_rep02_2589 +GUCAUUUACUUAAAUUAUUUUGGUUGUUUUUCCCUUUUUUUCCUUCUUUUCCCACCCCCUC +>U2AF2_K562_rep02_2590 +UUUUCUAGCUACUCUCAGAACCGCACGUUUGACACGUACAUUGGGCAGGGCUACGUGAUUC +>U2AF2_K562_rep02_2591 +UCUUUCCUUCCUUCCUCUUCUUUCCUCCCUUAUUUCCAGGGUCUCACCCUGUUGUCCAGGC +>U2AF2_K562_rep02_2592 +UCCUUUUAAUGCCUUCACAGGGUCAGCGCCAAACUGGAGGGGAAUGAAACACUAAAAGUUG +>U2AF2_K562_rep02_2593 
+GAUUUUGUCCUUAGUUAUACUUCGAUUAAAACAUGGCUUCAGAGGCUCCUUCCUGUAAUGC +>U2AF2_K562_rep02_2594 +CUUUGAAUUAUGCUUGUGUUUUUUUCUGUUUGGAUGACUUUUACCCCACCACUAUUUUAGG +>U2AF2_K562_rep02_2595 +AGGGGUGAAUGGUGCUGAGGUGCGAGGAGAGGGAAGGACAGUAAAGAGCAGGUGGGCAGGA +>U2AF2_K562_rep02_2596 +UUAUUUCUAUUUCAGACACCAACCAUCUGCCCAGUUGAAGAUUUGCAAAAUAAUUGUUUUU +>U2AF2_K562_rep02_2597 +UCCCCUUUUAUCCAGGGUAGGUCCAGGUAAAGCCAAAGGCCUUAUCCUUAUCUACACUGCU +>U2AF2_K562_rep02_2598 +UGGCUGCCUCAUUGCCACCUCCACCUGCAGGAAGGCCAGAGGUUCUGGUGGAGUUGAUUGA +>U2AF2_K562_rep02_2599 +AGGUGGUAAAUAAAGAUGUCCUGGACGUUUACAUUGAGCAUCGGCUAAUGAUGGAGCAGCG +>U2AF2_K562_rep02_2600 +CCAAUUACAUUAGCAAACUUUGGGGGCUCAAAUGCAAGGUGGUUUUGGAUGUGGCAACCAG +>U2AF2_K562_rep02_2601 +UCUUUUUUCGCUUUUAGGAUGAUCGCUGCAAGAUCCCUUUAUUCAUGCUAAUGUCCUUUAU +>U2AF2_K562_rep02_2602 +AUUUCUCCUCAGAUAACUUCAAGUGAUGUACGAAAAGGUUUGGAGUUCAUUUUUGUGGAAA +>U2AF2_K562_rep02_2603 +UCCCUUUGCCCCUCCCAUUCCCAUAUCCUUUUUUUCUCUCCUCCAUAGACCACAUAGCCCA +>U2AF2_K562_rep02_2604 +UGUCCCAAAUCUUCUAGGUACCAGGACAUUAUUCACUCUAUUCAUCUAGCACGGAAGCCAA +>U2AF2_K562_rep02_2605 +GUGUGGCUCUGAGCUGAUUCAUUUGCUGCUCAUCGUAUAGGUGCUGCCCAGAGUAUCCUUA +>U2AF2_K562_rep02_2606 +GUAAAUAUCCAUGUGGAAAAAGUAGGGAGUGUGUUGCCCCAAACAUCUGCAAAUGUAAACC +>U2AF2_K562_rep02_2608 +UCUGCUCUUUUCCCACAGCGGGACGACCCUGGGACAGUCUCCACUGGGGCAGAUCCAGCUG +>U2AF2_K562_rep02_2609 +AAACUCAAAAGUGUUCAUUUAUUCCCAUUUCUCCUCAGAUAACUUCAAGUGAUGUACGAAA +>U2AF2_K562_rep02_2610 +UAUUGAAUAUUUUUGAUUUGUCUGCUUUUCUCUCCAUAGAAAGCUUAUAGCUUCAUUGCAC +>U2AF2_K562_rep02_2616 +UUUCUCCACCUUUUAAGGUUUUUGGCUUUCAUCGCUUUUUCUACAUGUUUUUAGCCUCACC +>U2AF2_K562_rep02_2618 +UUUCCUCUCUUUCCAGCUAAUAUGCAAGUGAACCAGUGACCUGCAGUUCUGCCCACACAGG +>U2AF2_K562_rep02_2619 +UUUUUCUCUUCCAUCAAAAUGAGUUUUAGAACUUUGCCCUGAUGUUGACAUUUUUCAUUUC +>U2AF2_K562_rep02_2621 +UCUUUGCCAAUUUUUCCUUCUUCUUUUUUUCCCCAACCUUUUCUUCUUUCCCAACUUCCCC +>U2AF2_K562_rep02_2622 +UAAGGUUGCCUUUUCCACCUUCCAUCCUGUUUCCUUAAAAACAGCAAAUAACAAUCUACAA +>U2AF2_K562_rep02_2623 +AAGGUUGCCUUUUCCACCUUCCAUCCUGUUUCCUUAAAAACAGCAAAUAACAAUCUACAAG 
+>U2AF2_K562_rep02_2625 +GUUUUCAUUUUGGUUUUCAGGGGAGCCCUGGAAGCUUAUGUUCAAUCAGUGAGAAGUAGAG +>U2AF2_K562_rep02_2626 +UUUGAGACGGAGUCCCGCUCUGUCACGCAGGCUGCCAGGCUGGCGUACAGUGGCGCAAUCU +>U2AF2_K562_rep02_2627 +GACAGGGUCUUGCUCUGUUGUCCAGGCUGGAGUGCGGUAGUGCUAUCACAGCUGACUGCAU +>U2AF2_K562_rep02_2628 +UUUUUUUUGCAUUUAGGCUGGAGGCAAAGCUGGAAAGGACAGUGGGAAGGCCAAGGCUAAG +>U2AF2_K562_rep02_2629 +AUUUUAUGUUUUUCCUGUCUUUUUUUUCCUUUGAGUAACGGUUUUAUCUGGGUCUGCAGUC +>U2AF2_K562_rep02_2630 +AGGUAUGCCGAGCAGACAGCUGGAGGAGCCCGGGGCAGGGACACCUAGCCCGGUGCGUCUG +>U2AF2_K562_rep02_2631 +UGUAUUCUAGAUACAAAUCCCUUCUGUUCAUCAGGGUUGCAGGAUACAAGAUGAAUAUACA +>U2AF2_K562_rep02_2633 +GGUUUAAAUUUGAUGUAAGUUUUUUUUUUCCCCCCAGAAAACUUUAGAAACUGUUCCUUUG +>U2AF2_K562_rep02_2634 +AUUUGUGUUUUCUCUCCCUCUUUUUCUUGAUCAGCAUUAAUAAGGACUUAUAAAUUGUAUU +>U2AF2_K562_rep02_2635 +AUUUGUGUUUUCUCUCCCUCUUUUUCUUGAUCAGCAUUAAUAAGGACUUAUAAAUUGUAUU +>U2AF2_K562_rep02_2636 +CUAUUUCUUUUUUCCAGGAAACCAGGGCUUGCAGAUAUUGGUAAGUUGCCCAAGGUCACAC +>U2AF2_K562_rep02_2637 +UUUUUUUUUUAGGUACUGUCCAAGAAGCUGGAACAUUAUUAUCCAGCAAGAAUGUUCGUGU +>U2AF2_K562_rep02_2638 +AAAAUGUCACUUUUCAUCCCCAGUUUGCCUUUUGUCUGAAAUGCACCAGUGAAGCAAUCAA +>U2AF2_K562_rep02_2639 +CUUUGUUUUCUUCAUCUCCCCUGUAGGGCCAUGUUUAUGAGUGGACUAAGUGAAAGCAAAC +>U2AF2_K562_rep02_2642 +CUUGCCUCCCACCCAGACAUGAGCACCAGCCUCCAGGAAGGCCAGGAGGACGGGCCGGCAG +>U2AF2_K562_rep02_2643 +UUCAUUACUGCACAGGGGUGGCGUACACAUCAGAAUGUUUUCCUUGCAAGCCAGGCACAUU +>U2AF2_K562_rep02_2644 +GUCCCCCUCCCAUGCUCUGUUUUUCAUUACUGCACAGGGGUGGCGUACACAUCAGAAUGUU +>U2AF2_K562_rep02_2645 +GCGGCCUGUCUCCUCCCCGCCAAGACGCCGUGUGCGCCGCCUCGCGCAGCUCCGCCUGGCC +>U2AF2_K562_rep02_2646 +UGUUUUUCUUUCUGUAGCAUGGCAAGGUCACAAGACAUGUUUAAGUAAGGUAGGCUCAUGU +>U2AF2_K562_rep02_2647 +UUUCCAUUAAGGUUAAUGUUCGUGAAGAAAUUGAAGAGUUUUUUCCAAGAAUGUGGAAGAU +>U2AF2_K562_rep02_2648 +UAUAAAUGUGUUACUCACAGCGGUUCAAGUCCACACUGAAGAGCAACAGAAGAGUCAUCCC +>U2AF2_K562_rep02_2649 +UUCUGUAGACCUCGAAGUAGGGGGAAAACUGCAGUGGAAGAUGAGGACAGCAUGGAUGGGC +>U2AF2_K562_rep02_2650 
+UUGUUGUUUUCUGAGAUGGAGUCUUGCUGUGUCACCAGGAUGGAGUGCAGUGGCAUGAUCU +>U2AF2_K562_rep02_2651 +AGAUCUUGGGGGCAAAGGAAACCUUGGGGAAGGCAGGCUGGUAAGGGCCUCCCAGGAGGAU +>U2AF2_K562_rep02_2652 +GCCUGGUCAUGAGGCAGGGAGGGGACGGGUGGUGCUGCGUGCAGGGCAAGGGCUGUGGACG +>U2AF2_K562_rep02_2653 +CACUUGAUCUUUUGUUUCCAUGUUUGUCACUAGAUGCCCAUAAAAUUUGUGGAUAAGUGUU +>U2AF2_K562_rep02_2656 +ACCCACAGUUGAAGAUUCCUGUCUCUGGAUCCAAAUCAGAGGGCCUUCUCUACGUCCACUC +>U2AF2_K562_rep02_2658 +UUUUCUUUUUUCUUUUUCAGUUGCAGGAAUUUAGCCAAUUCAGAGGUCUUGUUCUCCAUAA +>U2AF2_K562_rep02_2659 +UUUCACCUCUUGGUUCCUCCCACAGAGCACUCCAGAAGAGAGGCUGCCCGUGGAAGGGAGC +>U2AF2_K562_rep02_2660 +UUCCUGAUAUUGAUAAUUUGUGUUUUCUCUCCCUCUUUUUCUUGAUCAGCAUUAAUAAGGA +>U2AF2_K562_rep02_2661 +AUUCCUGAUAUUGAUAAUUUGUGUUUUCUCUCCCUCUUUUUCUUGAUCAGCAUUAAUAAGG +>U2AF2_K562_rep02_2662 +AUUCUCCUGUUUAGAUAAAGAAAGCCGCCCACCUCGGAAAUUUCCUUCUGAUAAAAUUUUU +>U2AF2_K562_rep02_2663 +UUUCCAUUCCUACAGAACUGAGAGAAGAUGGUUUCCAGCCUCAAACUUACCUAGUACAGGG +>U2AF2_K562_rep02_2664 +GUCCGUUUGCUCUUUUUGUCUCCCAACUAACAGUGGUUUAUCAGAUACUAUCAUUUUGGAU +>U2AF2_K562_rep02_2665 +GUAAACUAUUUGUAUUUUCAGGUCAUAGCCACCUUCCAUUCAUCUUUCAAACAAGUAAUUC +>U2AF2_K562_rep02_2666 +UUGUAGGAAAUACAACUGGAGCACGCAAAGCAAGCCUUUGUGCAACGGGACAAUGCUAGGA +>U2AF2_K562_rep02_2667 +GGCAGAGAAGCGUGGGGUGGGUGGCACAGAGAGGAUGGAGGGAUCAAGAAGGAUGUGUCUU +>U2AF2_K562_rep02_2668 +GUCAGUUCACAUUGAGUCUUCUUUUCCUUUACCCCUCUUCCUCCUGCAGGCAUCUCUAGGU +>U2AF2_K562_rep02_2669 +CUCUGUUCUUUCCUCCUGGCAGGUGACAGAGCUGAAUGAGCCACUGUCGAAUGAGGAACGA +>U2AF2_K562_rep02_2673 +AUGAUGCACUUUAUUCUCAUUCUUUGUGCCAUUUUCUUUUUUCGAUCUUUCUCAGGUAGGG +>U2AF2_K562_rep02_2674 +ACUUUUCUGCUUGACAGGCCGGACAGUGGCUGUGGAUUGGGCCGUGGCAAAGGAUAAAUAU +>U2AF2_K562_rep02_2677 +UUUCUUUUAUGUGUAGGACCUGGAGCCAUGGAAAGAAAACUUGAAGAUCUAUUUUAGCCCU +>U2AF2_K562_rep02_2678 +UAUUUUUCCUUUUUCUCCUUUCAGAUAAACAUCUCUAUUAAAUUAGGAGCUAUCAUUUUUC +>U2AF2_K562_rep02_2679 +UUUUCCCACAGUACUCUUUCCAUUCCUUACCCCAGUUUUUGAAGCAUUAAAUGUCUCUCUG +>U2AF2_K562_rep02_2680 +UCCCUUUCAGUAUUUAGUGUCUCUGAUCCGGGACAAGCUAGGAUGGAUGUGGGUUUUCUAC 
+>U2AF2_K562_rep02_2682 +CUGUUUUUCUUUCUGUAGCACGGCAAGGUCACAAGACAUGCUUAAGUAAGAUAGGGUCAUG +>U2AF2_K562_rep02_2683 +CUGUUUUUCUUUCUGUAGCACGGCAAGGUCACAAGACAUGCUUAAGUAAGAUAGGGUCAUG +>U2AF2_K562_rep02_2684 +UGUGUGUAUUUUCCUCCUAGGUUCAUUUUCCAGACACUGAAAGAGCAGAAUGGCUAAAUAA +>U2AF2_K562_rep02_2685 +UGGGAUUGGGGAGAUCAUGGAAAUGGAGGAGAGCCUGAGCACCGUAGAUCUUGGGGGCAAA +>U2AF2_K562_rep02_2686 +ACCUCUCUUUUUGUGUCCUUUAAUUAUCUCCCAAGUUUUCUUUAUGUGACUCUUGUACAUU +>U2AF2_K562_rep02_2689 +CUUUCCCUUCCAUUUUUCCUGGGGUGCCUCUCACCCUGCAUCUGCGCGUUCAGCAAGCUGG +>U2AF2_K562_rep02_2691 +CUUCCAUCUUUCAUUACUACAAUUUACCAUGCAGAGCUCACAAUGUCUCUCUGCACCAAGC +>U2AF2_K562_rep02_2692 +CCUGAGCUUUUGGGGCGCGGGUGGGAGCGCGGGGGAACCCUCAAGACGGCUUUCUUUUGGC +>U2AF2_K562_rep02_2693 +UUUUUUUUUCCUUCUCAUUCUAGGUAGAAGAUGUGUUACAACGUUGUCGAGAAUAUUUAAU +>U2AF2_K562_rep02_2695 +ACUAAUUUAGGAUCAACCACAGGUUUGUCUGCUACCCCCCCUGCCUCAUUACCUGGCUCAC +>U2AF2_K562_rep02_2696 +CCUCCUGCUGUUUAUUAGCUUUGUGCGACCCUGUCUGCCUCAAUGGUGGUUCGUGUAAUAA +>U2AF2_K562_rep02_2698 +CAGAACAUCUUCCUCUUUGGCAGGUCUUCAAACUUUGGUGCUGAAGCUUUCGUUAAAAGGA +>U2AF2_K562_rep02_2699 +UCCCCCAGGUUACCCUUAAGUUACAGGAGUCCCAGCUGCCUGGGCCAGACCAGUUACAGCA +>U2AF2_K562_rep02_2700 +AGGAUCUCCUUCUGUCCCCUAGGCCGGAGAGCAGUGGGGCAAUCAUGGCUGACUGUAGCCU +>U2AF2_K562_rep02_2701 +UGACUUUAUUUUCCUAGGGGAAGAAGAUGGCUCUCUGUACCAACAAUAUAACAGACUUUAC +>U2AF2_K562_rep02_2702 +UUUGUUUGUUCUUCACAGGAUGGACAACCGGAAAUUUUCUACACAUUUUGGAAUUCAGUUA +>U2AF2_K562_rep02_2703 +UGUUACAGGCUUCUCCCACCUGCCCAGUGGGCUGUACCCAUCCUACCUCCACCUGAACCAC +>U2AF2_K562_rep02_2707 +UUUAACUUUUCUUCCAUACAGAGGAGUUUGUUCUGGCAGCUCAGAAAUUUGGUCAGGUUAC +>U2AF2_K562_rep02_2708 +UCUUCUUUUCAGGGUGUUCUAAGGAUACAUUUUAUUGAAGCUCAGGAUCUUCAGGGGAAAG +>U2AF2_K562_rep02_2709 +UUUGGGCCUUGCUUCUCCAUGCCCAGAGGCAAGCCCCCCGCCCCAUCCCCUAGGGGACAGA +>U2AF2_K562_rep02_2710 +UUCCCACUUUUUUGUUUCUAGACUGAGUGUACUUGGUCUGGUAUUUGUGGCAUAACUUACG +>U2AF2_K562_rep02_2711 +UCCUUUCUUCCAGGUUGUUUUUGAGCACGUUCACUCUCGCAGUGUCAGCUGGGGCUGUUUU +>U2AF2_K562_rep02_2712 
+GAUUAGGGAACGACAGUGGGUAGAUGAUUUUCCUCUCCACCGAAGCGCCUGUGAAGGAGAU +>U2AF2_K562_rep02_2713 +UAUCUUUUAAUUACAGACGCAGGGACAGAGCUCAUCGGGAAAUCAAGGAUAUUUUCUAUAA +>U2AF2_K562_rep02_2714 +UAUCUUUUAAUUACAGACGCAGGGACAGAGCUCAUCGGGAAAUCAAGGAUAUUUUCUAUAA +>U2AF2_K562_rep02_2715 +UUUUGCUUUUUCUCUUUUAGGACGCUAUUGAUAACGGAAUGGUUGCAAUUAAGGACAUUUU +>U2AF2_K562_rep02_2716 +GGGAUUGGGGUGGGUGUUUGUCUUCCAUGUAGUUUAUAUCCUGGAACCUGGAGAUCCUCCU +>U2AF2_K562_rep02_2719 +AUUUCUAGGUAUUAAACUUGCUGCUGCUGUUGGGCUUUUUCCACAUUUUGUCUUCUGUUUU +>U2AF2_K562_rep02_2720 +CCCCCUUUUCCUUCCAGCCUUUCAUUCUACAGACCUGGACUUCUACUCUUUGCUGCUUUUG +>U2AF2_K562_rep02_2721 +AUUAAACAUUUAUGAAGAAUCACCUGUGCACAGCGCUACGCAAGAAGAUACAGAGACAUAA +>U2AF2_K562_rep02_2722 +CCUUUCUUCCUUCCCUUCCUUCCUUUCCCCUUCUCCUUCCUUUCUCCCUCCUUCCUUCCUU +>U2AF2_K562_rep02_2723 +CUUUUUUGUUCUUUUUAGGCUGGAGGCUCCCAGGUGAUUUUCACAAAUCCUUUAGAAAUCG +>U2AF2_K562_rep02_2724 +UCUUUUUAGAUUUUGUGGUGGAUGCAACCCGCAAGGGUAACAAAAUUCGUUUUGCAAAUCA +>U2AF2_K562_rep02_2725 +UACCUGAUUGCCUCCUGCUUAUUUCUUCUGCCUGUCUACUUUCCAUUCUGCUUUUACAAUG +>U2AF2_K562_rep02_2732 +UCUUUUUUCCCAGUGCCCUUCUUCAUUCCAGACAUGGUGCUUUGAACAAUUUGACUUGGAG +>U2AF2_K562_rep02_2733 +UAGCUUACAGUGCUUGAAUGAAACACUCACAUCAUGCACAAAAGAAGUAGGAAAGGCUGCU +>U2AF2_K562_rep02_2734 +UUCCUAAUUUGGCAGCAGAAGGGGGAAAAACCAGGGCCUUUCACAGACAAGGCUUGUUUUA +>U2AF2_K562_rep02_2736 +CCUUUUCCUUUUUUUGGUCCUUAGGUUCUGAGUUACUUUCACCAUCAAAAGAAAGUUCGGC +>U2AF2_K562_rep02_2737 +UUUGAAUCCUUUGCAGCCCACACCCCACCUCCAGUUCCAACUCCUCCACUUCCUUCCAUUU +>U2AF2_K562_rep02_2741 +ACUCUGAUUCUGCCCCGGCUGCAGCAGGAAGGGGAGCGGAUCCGCAGUGUGCUGGACGGCC +>U2AF2_K562_rep02_2742 +CUCAAGUGUUUUUUAAGGUACACCCAAGCCCCUUCAAGAUGUAACUUGACAAAUUUUUUAA +>U2AF2_K562_rep02_2747 +ACACACUUUUUUUUAGGGGCUGGGCCUGUAUGCUGCUCGAGACAUUGAGAAACACACCAUG +>U2AF2_K562_rep02_2749 +UAAGUAUACUUAUCACUGCAGGUGGGUUCACCUAGAGUGUGACAAACCAACAGAUCAUGAA +>U2AF2_K562_rep02_2750 +UCUUUCCCAAAACUAUUCAGGAUUUUUUUCCUCAAGUGGCAAGUUGCCCCAUUUUAUAACA +>U2AF2_K562_rep02_2751 +UGUAGCCAUCAGCCAGCAAAGACCUCGUCAGUGUCUUUAACUGCGACCUUUCGUCCUCAGG 
+>U2AF2_K562_rep02_2757 +CUCCCAUCUUCACCCCACCAAGGCCGAAUGGGUAAUAGCCGAAGUGCCCUGAAGAUGAUUA +>U2AF2_K562_rep02_2761 +UGGGACUUUAUCUCUACUUUUUCCUUUCCUUUCCCAGCCAUUAAAAUAGGGUGAGAUGGUU +>U2AF2_K562_rep02_2762 +AUUUUCUAGAUCCCAAGCAGGUCUGUUCCAGCCUCUGAUUGUGUAUCGGGGCAAGAUUUGC +>U2AF2_K562_rep02_2763 +UUCCUCUUCUAGCCUUUCAGUGCUACCUUCAUCUCUUUCAGUUUUUCAAAAUCCCACAGAU +>U2AF2_K562_rep02_2765 +UACUUUUCUCAUUUUGUUUGCAAUCUUGGUUGAACAUUACAUUGAUAAGCAUAAGGUCUCA +>U2AF2_K562_rep02_2766 +UCUGCCACAGGAAGCUGGGCCGGGCUGCUGUGCCUGGGAGGAGGGAAGGAGGAAUGAGAAA +>U2AF2_K562_rep02_2767 +UUUUUCUCUCAUCAGUUUAGGUCUUAGGAUCUACCAUCUGUUACUUUUCAGUUUCUCAUCU +>U2AF2_K562_rep02_2775 +CUUUUCUCCCUUUUGCUUCACUUUCCCUAGGUCUGUUUCAUUCACCUUUUUAAAUAAAAAU +>U2AF2_K562_rep02_2776 +UUUGUUUUUUUAUACAGGUAUGGAAAAGUUGAGGCCACUCGCAUAUUGUUAGAGAAAGGAA +>U2AF2_K562_rep02_2777 +CCAGGCUUUUUCUCCCUUUCUCUCACACUCAAGGAAACAGGUGAAUAAAAGUGACAUGAAG +>U2AF2_K562_rep02_2778 +UCUUGUCCACUCCCCCAAGGCGUGCCCCACUUCCGCAGUGCUGAGUCCCAGCGGGGAGCCC +>U2AF2_K562_rep02_2784 +UUCUUUGUUCAGGUGGAGUACAUCCUGCUGCUUCAAGGGUAGAAGACUCCUCACUGCUUUC +>U2AF2_K562_rep02_2791 +UUACCUCCCUCCAUAGGUGAGGAAAAGAGCCAUGAAUCUAAACAUCAGGAAUCAGUUAAAA +>U2AF2_K562_rep02_2792 +AAUAUUCUUCCUUCCUGACAGGGGGAGUCGGUGAAGUACUUCCUGGACAACUUGGACCGGA +>U2AF2_K562_rep02_2797 +UGCCUUAUCUUUUCAUUUGAUCUCACCCUUAAAAGGAAAAAAAUGUUAUGAAAUAAGAGAA +>U2AF2_K562_rep02_2798 +CUGUCCUCUUUUCCCCCACAGACCUGGCGCACUGUCAUGCCUACCUGGUAGAAAUGAGCCA +>U2AF2_K562_rep02_2799 +CGUCCCCUUUUGUACAUUAGCAUAUCCCAGCAGCUCGUGGAAGCAUUUGUGAACGAAGAAA +>U2AF2_K562_rep02_2806 +GUUACCCUUUUUAUAGGUUUGUGGAAUCUUGCUUCCCUUUUUUCCAACCUUUGUUUAUUUG +>U2AF2_K562_rep02_2807 +UUUGUCACUCAGCACUUUUUCUCCAUAUUCUUCAAGACGAUUGUGAGUAUGGUACGUAACA +>U2AF2_K562_rep02_2808 +UGUUGUCUUUCUCCCACCCCGUGCAGAGUACAUCCAGAAAUACGCCACGGAGGAGGCGCUG +>U2AF2_K562_rep02_2809 +UUUUAUUUUUUUUGCAGGAAAUGGGGCAGCCUUGAGGUCAGACUUGGAAUUAUGUCCUAGC +>U2AF2_K562_rep02_2810 +CUUUCUGCCUUCCUCCUCUCCAGGAAGCUCAAAGGCCCUGUGGCCCCCCAAGAAUGGCAGG +>U2AF2_K562_rep02_2813 
+ACACUGCGGAUGCUGGGGGGAGGGGGGAUUCCACUCCUGUUUUGUGAGUAGGCGACCCAUG +>U2AF2_K562_rep02_2814 +UUCUCUUUGCUUUUCAGGAUUCCCGAGAAAGCACCAAGAGGGUAGAGAAGGACAUUGUCUU +>U2AF2_K562_rep02_2823 +AUAAUUUUCUUCCUCCCUUCAUUCAGGUUUCCACUAAAAUGUCAACUCAGUUCUGAUCACA +>U2AF2_K562_rep02_2824 +UAUAUUCCUCCUCCUAGAAGUCUCAGGGGAUCCAGAACUGCAGCCAGUCCUUGCUGGGCUG +>U2AF2_K562_rep02_2825 +UAUCUUCUUGUUUUUGGACAGUUCUGCUCAGAAGGAAAGGUGUAUUUGUCCAUGUUGGAAG +>U2AF2_K562_rep02_2826 +GACCCUCCGGCUUUUGCUUGUCCUUUUCCCUUCUAACAGGUUAUCAAGACUCUGAUUCUGC +>U2AF2_K562_rep02_2827 +GCUUUUUUCCUAUCUUCUCCAGGUCUGUGAAACGUAAGUAUAGCUACCCCAGGCUUAAACU +>U2AF2_K562_rep02_2830 +UUUAUGCUUUUUGUCCCUAGCUGCUACUGUUUGAACGGUCUUGGAUGAACAGAUGGAAGUC +>U2AF2_K562_rep02_2831 +AUUUUAUUUUAUUUUCAGAGAACGAUCUCCUCAGCAGAAUAUAGUAUCUUGUGUAAGUGUA +>U2AF2_K562_rep02_2832 +CCUUUUUUUCUCCUACUGGGGUGUUUACAGGGCAUGGUAAAAGGAAUAAAGGUGAAAAGAA +>U2AF2_K562_rep02_2833 +UUUCCUCUCUCCCUCCUCCUCCCACAGGAGGAAAUCCUGAGCAGCCUGUUCAACUAGAAAA +>U2AF2_K562_rep02_2844 +CCUUACUCUUGUAGAUAUUGGUCCUGUCACUGAUGAUCCUUCCUCUUUGCCUCAGCCAAAU +>U2AF2_K562_rep02_2845 +AUUUCCUUAGGCUCACGCAGCCCUAGCAGGAGCCAACACAGGUAGGUGCACUGAAGAUCAA +>U2AF2_K562_rep02_2846 +CUGUCCACUAUUAUCCCAUAAUCUCUUUUCACCUUAGUUUCAUUAAACAUUUAUGAAGAAU +>U2AF2_K562_rep02_2847 +GACUGACUUUUCCACAGGGGAAGAAGAGGUGAAGGUUUCGACCAUGCCACUGUCAACCUCU +>U2AF2_K562_rep02_2848 +UAUUUUCUCAACUGCCAUAUCCUAGGGGGCUUGGAGUACCCAUAAUACAGUGAGCCCACCU +>U2AF2_K562_rep02_2849 +AUUGUUUUUGUUUCCCCUGAUAGCCUCUGAGUUCCUUCCGGAUAACACUGCAUCAACAAUG +>U2AF2_K562_rep02_2850 +CUGAAAAGUGUCUUUCUCCCACCCCAGGGGCCUGGAAUAGGAAAUGCCUCUCUUUCUACGU +>U2AF2_K562_rep02_2851 +AACAUUUUUUCUGCCUUCAGGAAGCCCUCAAUCUAGAAGAGUAGAGGUCCAAAGGUGCCAU +>U2AF2_K562_rep02_2857 +CAGUGCUUCCUCAUUCUCUUUUAAAACCCGCUUCCCGCUGAGUCUGCACCCAGGAGACCAG +>U2AF2_K562_rep02_2858 +CUCCUAUUUUUUUCUCAUUCUCCUGUUUAUUCCUCUGUUUGCUUAGUUUACAGAAAACGAG +>U2AF2_K562_rep02_2859 +AGGUACGUAUUUGGGUUUGCCUGUGGGUGCCUGCCCUCCUACAUAGAGCCUUGAUCUUCCA +>U2AF2_K562_rep02_2860 +GUUUUUGCCCCCUCUCUCUUUCUGACAGCACACACAUGCCCUCUUGGUUCUGUUUCUUUGA 
+>U2AF2_K562_rep02_2861 +UUUGUUUUUUUGCUGUGCCCUAGACCGUUACAUAACUGAAGACUCCCACCUUCAGGCAGGA +>U2AF2_K562_rep02_2862 +UUUCAUGCUUCCUUCCAUUUUCGUUUUCGUCAUUUAAGGUGUAAAUGUACAUAAUUUAUCC +>U2AF2_K562_rep02_2882 +AUUGGGGAGAGGUGGGGGUGGGGGGUUCCCACUCCACACUGGUCACCCACCCACAGGGCUA +>U2AF2_K562_rep02_2883 +GUUUUCUUUUUAUAGCCCCAUUGACAAACCUUCAGAUUCUCUCAGUAUAGGGAACGGUGAU +>U2AF2_K562_rep02_2884 +CAAAUGUCUUUUCUCUAGCCUUCCAGCAUUGGGUCCAUGGCUCUGACUGAGAGUGCACUAU +>U2AF2_K562_rep02_2885 +AUAUUUAUUUAUUUAUUUUAGGCUGAGCCAUUGAAAGUAAGUGCAAAAGCCCCUCUUUGGU +>U2AF2_K562_rep02_2886 +UUACCAUAUUAAUGUUGAAUAGCAUCUCAGGUUUCAUUUCACAAUGCACGCAUGGAGUUGG +>U2AF2_K562_rep02_2887 +CCUUCAUCCCACGUUACCCUCUUCCCCUCCCCUUAUGUCUCAAUAUGCCUCUGCCUUUUGC +>U2AF2_K562_rep02_2888 +GGAGUGAACUUUGCGCACUUUCUUCCUUAUGGCAGUGGCCAAUUUAAUAGUGGGAAUCGAC +>U2AF2_K562_rep02_2889 +UCAGAGUUAUCAGGUCUCUUUUGCCCCUACAGGUUUUUAUGUGAUAGUCAAAAGGAGCUGG +>U2AF2_K562_rep02_2905 +UUUCCCUUUUCCUUACCUAGGCUAUUAGUCCUUAUUUGCCAAGAGGUGAUCCAGUUCUGAA +>U2AF2_K562_rep02_2906 +GGAUAAAUAUAAAGAUACACAGUCUGUUUCUGCUAUAGGUAAGAUGUGGUAGUGUUGGGUG +>U2AF2_K562_rep02_2907 +AUUUGGUUUUAUUUGCAGGUCCUAAUCUACCCAUGGCUACAGUUGAUAUAAAAAAUCCAGA +>U2AF2_K562_rep02_2908 +UCUUUUUCAUUCUGCAGAUUGCAGGAAUUGACGCUGUAUAAUCCAGAACGCACUAUUACAG +>U2AF2_K562_rep02_2909 +UCCUUUUCUUUUCCUCUUUCUCCUCCUCUUUUUUCCCCUUCUUCGUCCUCUUCAUUGUUGU +>U2AF2_K562_rep02_2910 +CUACUUUUAGGAUUCCUAAGGGAUUUGUGUGAGGUCUUACUAUAUUUAUUGCUACCUCCUG +>U2AF2_K562_rep02_2912 +UUUAGAACAUUAGCAGUGUUGUGGCUGCAUUUUCCGACCUUCUUCACGUCCGAAUCCCUAA +>U2AF2_K562_rep02_2928 +UUCCCCUUAAUCACACAGCAUUGGCAUCAACAAAAGUCAGAAUUCCCGGGAACUUGAACAG +>U2AF2_K562_rep02_2929 +UUUCUUUCUAGGGGUUUAGUGGUUACUCUCCUGUUUGGAAAAACAAACUCAGAGAAGUACC +>U2AF2_K562_rep02_2930 +UCAGCUCAGGUACCUGACAAUGAUGAGCAGUUUGUACCAGACUAUCAGGCUGAAAGUUGUA +>U2AF2_K562_rep02_2931 +UGUUUUUGUCUUUGUUCCCUCAUUCCCAGGUGCUAGUGUAUGAGUUGUUGUUGGGAAAGGG +>U2AF2_K562_rep02_2932 +AGUGGGGUGCCAUUUUCUUCCUGCAGGUGCUGGGUGAAGUUCAGAAGGCUCUGAGAGGCUG +>U2AF2_K562_rep02_2933 
+UUGAAUUUUCUCUUGUUCACAGGUGGAGAUACACUACGCCUUGACACACUUAUAGAAUGGU +>U2AF2_K562_rep02_2934 +UUAUUUGUACGUUGUGUUCUGGUAGUAGGGGUUUAGGAAUAUGGUUUUGAGUAAGAGACUC +>U2AF2_K562_rep02_2935 +AUGUUUAAUUUCCUUUUUCCCUGUAGCUUUUACAAAGUUGAUCACAGUAAAUGGACAAGAA +>U2AF2_K562_rep02_2936 +AUUACUUCUAGGUUGGGAGGUGGCUGGAGAUCAUAUCCAGAGUGGGGCUGGAGGUUCUGAC +>U2AF2_K562_rep02_2937 +CUUUUCCCACCCCUGCCCCUUUUCAACUUUCAGAGCACUAGACAAACUGAAUGGAUUUCAG +>U2AF2_K562_rep02_2938 +UUCUUUUCUUUUUUCUCUCAGGAACUAAACAACUUAAGCAUAUUUUAUUAAAAGAUGUGGA +>U2AF2_K562_rep02_2939 +ACCUCUUUUCCCACAGUCGGAGUCUCAGGACCAGGUCUUCCUACGCUGGAGCAGCGGGGAG +>U2AF2_K562_rep02_2940 +UUUGUUGCUUGUGUUUGUUUUUCCCCUACAGACGUAUGACCUUAGCAGACAUUGAACGGAU +>U2AF2_K562_rep02_2941 +AAUGACUUCAUUUUUCCAGGCCCCAAAUUCUCACCAGUCCGUCUCCUUCAAAAUCCAUUCC +>U2AF2_K562_rep02_2957 +UUUGUCCUAGUUUUCCUAAAAUUCCCUUUUCCACUGGUGUGUGGUGCAAGAUGAGGCACAU +>U2AF2_K562_rep02_2958 +UCCUUGUAUUUUGUGCAGGUCUGCAGACUCGUGAAUGAGGUCUACCACAUGUAUAAUCGAC +>U2AF2_K562_rep02_2959 +UUAAUUAAUGUAUUACUUUCUCCCUUAUUUUUUCCUUGGAUUCAUUUUACUAUUAUUCAUG +>U2AF2_K562_rep02_2960 +AAUCUUUAUUUCCUUUAACUCCUCAGCACUUGUUUUAACUUGCUUAUUUUCUUUAGUUUUU +>U2AF2_K562_rep02_2961 +CCUCCCCUGUGCCUUCCACAUUCUACACCCUUUACCACAGGAGAGGUCUCUGUUAGCUUGC +>U2AF2_K562_rep02_2962 +GCUGUCUUAUUUCUCCCUUCCUUUAGAAUCCCUUCUUUUUCAAAACACUAGAAACCUCCCA +>U2AF2_K562_rep02_2963 +UAGGUAGAUAAAGUGGUAAUAAAUCCAUACUUUGGUCUAGGAGCUCCAGACUACUCAAAAA +>U2AF2_K562_rep02_2964 +AACUCUCUUUUUCCACCCCCUAAGUCUCUGGCAACCACUGUUCUGUCUCUGAAUUUGAUAC +>U2AF2_K562_rep02_2965 +GUCUUUCAAUAUCUCUUCCCUGUUUGGACCACAUUACCCUUCAUCAUAUGAAGCCUUGGGU +>U2AF2_K562_rep02_2966 +UUCUCUUCGUUUUUCUCUUCCUCUAGUGAACACUGACUCGGAAACUGCAGUUGUAAAUGUA +>U2AF2_K562_rep02_2967 +UUUUUUUUCUUUACUUACAGGCAGUACUUAAUUUUCCUAAAUAUUGUGAACCCGUGGUUAA +>U2AF2_K562_rep02_2968 +UUUUGAUCCUUUGUUUCAGACUCUGCCACAACUGAAAGCUCACCAACAGCCUGCCAAUAAA +>U2AF2_K562_rep02_2969 +UCUCUCCUUUCUCUGCAGGGCACCCUCCCCCAGGAGACUUCAUUGCUCUGGGCUCAAAGGG +>U2AF2_K562_rep02_2970 +UCUAACAUUUACCAGUUUUGCUUCCCUGCUUUCUUCCUAACACUGAUGAUGAUUUUUAUUU 
+>U2AF2_K562_rep02_2971 +CUCUCUCCCUUCCUCCCAUAGAGACCAGUCUUGGGGAACCACCUUUGAGGUUUGUGUGGAG +>U2AF2_K562_rep02_2972 +UUAUUUCUACCCUCUUCUCUCCUCACUCCCCAGCCCCCCAACUUUACCAUCUCCUCAAGAA +>U2AF2_K562_rep02_4839 +UUCCUUCCUCUGACGCCUGCUCUUACAAUAGGCGUCCCUGCGAGAAGAGUCACCCAGUGGC +>U2AF2_K562_rep02_4840 +CCUUCCUUUCAAAUAGAUGUCUGUGGACUUUAUCCCCAGGAAUGGUCUCUUGGUUAAAGUG +>U2AF2_K562_rep02_4841 +CACUGCUUAGCUUUGCUGGUCCAUUUGUCCCUGUGUUUUCCAUUUGCAUUCAGGCCUUUGA +>U2AF2_K562_rep02_4842 +AUGGUUCACCAUCUGCCACUUCUGAAAGUGAUGGGUCUAGUACAGGCUCUCUGCCGCCGAC +>U2AF2_K562_rep02_4843 +AUGGUUCACCAUCUGCCACUUCUGAAAGUGAUGGGUCUAGUACAGGCUCUCUGCCGCCGAC +>U2AF2_K562_rep02_4844 +CCCUCCAGGUGCCUCAAUGGUCCGGCCACCAGUUGUGCCUCGGCGCCCCCCGGCCCACAUC +>U2AF2_K562_rep02_4845 +AGAUGCGAGCCACCCCUCUGGCUGCUCCUGCGGGUUCCCUGUCCAGGAAGAAGCGGUUGGA +>U2AF2_K562_rep02_4846 +UUCCUUUUCCCCUCUUCUUACCCAGAGUGAGCACAAAUGGAUCAGAUGACCCUGAAGAUGC +>U2AF2_K562_rep02_4847 +UUCCUUUUCCCCUCUUCUUACCCAGAGUGAGCACAAAUGGAUCAGAUGACCCUGAAGAUGC +>U2AF2_K562_rep02_4848 +UUUCUUCUCCUGUGACAUUAUCUAGCAUGCUUUGCAGUGGGUCCAGAGUUGUCUGGGGAUC +>U2AF2_K562_rep02_4850 +CUUUCUUUUUGCCUAGGAGCCAUAUGGGGGUGCCGUUGGUCUCUGGUCACCGACAUCCUUU +>U2AF2_K562_rep02_4851 +UUUGCAUUUCUUCCCAGGCUGCCAGCGGGACCAGGAUGGCUAUUACUGGAUCACUGGCAGG +>U2AF2_K562_rep02_4852 +UAACAUGGCAGACCAGAGACAGCGCUCACUGUCUACCUCUGGGGAGUCAUUGUACCACGUC +>U2AF2_K562_rep02_4853 +CAACUCAUUGUUUGUCCACAGGUGCUGGCUUAUUCUCAGACUCUGUAUAUUGGGAGAGAAA +>U2AF2_K562_rep02_4854 +UUGGAUUUCUUGCUUAAUCAACUCAUUGUUUGUCCACAGGUGCUGGCUUAUUCUCAGACUC +>U2AF2_K562_rep02_4855 +UUUUUCUUUCCUUCCCCACACCCCAGGGCUACCAAGAAAAGAACAAAUUCAUUGCUGCACA +>U2AF2_K562_rep02_4856 +UUCUCCUUUGCAGCAUCAUGGCCAGCCCAAGAACCAGGAAGGUUCUUAAAGAAGUCAGGGU +>U2AF2_K562_rep02_4857 +CCUGUUUUGUCUUUAGGGUGUACAACUAUGAGCCUUUGACACAGCUCAAGAAUGUCAGAGC +>U2AF2_K562_rep02_4858 +AAGAUUCUUUUCCUAUUUUCCCCAAAUCUUUUAUAGCAUCUGUCAAUGGUUCACCAUCUGC +>U2AF2_K562_rep02_4859 +AAGAUUCUUUUCCUAUUUUCCCCAAAUCUUUUAUAGCAUCUGUCAAUGGUUCACCAUCUGC +>U2AF2_K562_rep02_4860 
+GAUGCUUUUUCCUCAGGUCCUGGGGACCUGGCCUCCCUCUGUCAGCAGUUUCUGACCUAAU +>U2AF2_K562_rep02_4861 +GGUCUUUCCUUGUCCAGUUCCAGGUCGCGGAGCAAAGGUCGAUCACGUUCUCGAUCAAAAG +>U2AF2_K562_rep02_4862 +UGUAGCUUGCUGAUGACCGUAUGGCACUGGUGUCAGGCAUCAGCUUAGAUCCAGAAGCAGC +>U2AF2_K562_rep02_4863 +CUGUAGCUUGCUGAUGACCGUAUGGCACUGGUGUCAGGCAUCAGCUUAGAUCCAGAAGCAG +>U2AF2_K562_rep02_4864 +GAAAACUUCCUGUUGCCUGCAGCCGCCCACGCAGAACAUGAACCUGGGCCCUGGAGCCCUG +>U2AF2_K562_rep02_4865 +UUGUCUUUCAGGAUUUUAUGCGACAAGCAGGUGAAGUAACCUAUGCGGAUGCCCACAAGGA +>U2AF2_K562_rep02_4868 +CCAGCAUCUUCGGCCUCUUGUCCGCUUUGUUUUCAGGGCCCAGGGGAAUCGCUACGUGGGG +>U2AF2_K562_rep02_4870 +CCUUUCCUUUUUCUUUUCUCCUCCCCCUUCUGUUUUGAAAAUCAGGUUGCUUUUCUGUUAC +>U2AF2_K562_rep02_4871 +UUCAAAUUCAGGUGUGCACUCUCCCAUGGCAUCUUCUGGCAAUACUGGGAACCACAGCUUU +>U2AF2_K562_rep02_4872 +CUUAAUUUUACAGGUGUGAGCCACUGCACCAGGCCCCUUCAUCUUAAUUUUAAUAUAUCUU +>U2AF2_K562_rep02_4873 +UGUGUCCUUCUGUCCACAGUCCCUGAGACGGCGGGCAACAGCAUCGGCAGGAACGCCAUGG +>U2AF2_K562_rep02_4874 +UCCCUGAUUUUCUUUUCAGACGUCUUUUUACAAGGGAAACGGUUCCACGAAGCCUUGGAAA +>U2AF2_K562_rep02_4879 +UAAGUUUUUGUUCAAGGUGACGUUACUGAGGCAGUGCUCUACUGAGAAUGAAAAUGACAUG +>U2AF2_K562_rep02_4880 +UAAGUUUUUGUUCAAGGUGACGUUACUGAGGCAGUGCUCUACUGAGAAUGAAAAUGACAUG +>U2AF2_K562_rep02_4881 +AAUUUGUGCUUUCUUUUUGCUCCCCCAGGGCCUGGUGAAAUCCCCAUGGGAAUGGGGGCUA +>U2AF2_K562_rep02_4882 +CCAGGACCUACUUGCUCAGAUCUCCAAGCAAGCAUUUCUUUUCUUUUAGGGAUGUCUGAAA +>U2AF2_K562_rep02_4883 +UCUCCUUUCCCCCCUUUCUACGCCUUUUCCCUUAGUCUUACCUGCAGUGGUGAAAAACGGA +>U2AF2_K562_rep02_4884 +UUUCUUUGCCAGAUCCCAUGAGCUGCGUUCCAAGGUGGUUUCCCUGCAGCUGCUCCUCUCU +>U2AF2_K562_rep02_4888 +UCUUGCUUUUCUCCUAGGCUUGGCACUGCUGCACCACCAAAGGCAAACUUCAUUGAAGCUG +>U2AF2_K562_rep02_4891 +UACUUUGGCCCCCUUCCCUGCUGUGGUUCUGGCCACCCCAGAGAGGUGAUCGAGAAGAAAC +>U2AF2_K562_rep02_4894 +UUUCUUUGACAAUUUUAAGCCUUGUCCUAGGUUAAGACUGAUGAACAGGAGCCAAAGAAGA +>U2AF2_K562_rep02_4895 +UGCAGCCAACAUUGGUACUCAGACCACAGGACCCAGUGGGGUAGGAUGCUGUACACCAGGC +>U2AF2_K562_rep02_4896 +CUCUUGCUUUCUUCCAAUCCAGGACUCCAUUAUUACAGUCUUUGAUUGGUCUUUUUGAGUU 
+>U2AF2_K562_rep02_4897 +UAGAGACUGCCUGCCUUUUCUCUCCUGGUCCCACCUCAGCUGACCCUCUGUCAGCUCGAAU +>U2AF2_K562_rep02_4904 +UUUUUAGAUAAUGAGCUUCAGUCCCCAAGAUCUGCGAAGACGUUUGUGGGUGAUUUUUCCA +>U2AF2_K562_rep02_4905 +UUUUUAGAUAAUGAGCUUCAGUCCCCAAGAUCUGCGAAGACGUUUGUGGGUGAUUUUUCCA +>U2AF2_K562_rep02_4911 +CAUCUUUUCUCUCCUGUAGUCUAAGGUUGUGGGUGACAGAGAGAACGGCAGUGACAACCUC +>U2AF2_K562_rep02_4913 +CCUUUUAGGUCCUUUUGGUGUGAACCAUGGGGUGGAACUUCACUCAGAUGUGAUAGAGUAU +>U2AF2_K562_rep02_4914 +UUUUUCAGAUAUGAGGCCCCAGGAUUCCUGGCGAGGUCCUCCUCCCCUUUUCCAGCAGCAA +>U2AF2_K562_rep02_4916 +UUAUCUCCUUAGGAAUACAAACAGAAGCUUGCACGAGUAACCCAGGUCCGCAAGGAACUGA +>U2AF2_K562_rep02_4922 +AUUUUUUCUUCCUAUAACUUUUCUUCUCUCAGGUAAACUAUCCUUUAAACUUUUGUGGAAC +>U2AF2_K562_rep02_4923 +AGUUUUGUUUCGUUUCUCCUUUUAUUCUCUGUAUUGAGCAAGUCUUAGACAUCAUACGUUU +>U2AF2_K562_rep02_4928 +GUGUGUUUUUCCUCCCCAGAAGAGGCGACAAAGGCCGUGACAGAGAUGAACGGGCGCAUCG +>U2AF2_K562_rep02_4929 +AGCUUAUUCUCUUGGGGGCCAAGAGAAUCUUGGUCUGAUCUCAGCUUCUCCACAAUCAGAU +>U2AF2_K562_rep02_4935 +UUUCAGGGUUAUUUUGGAGCUGUUGGAGCACUCCUUGAGCUGUUGAAGAUCCCGUGAUCAU +>U2AF2_K562_rep02_4936 +CCUUGUGCUUGUCCCCAGCGGCAAGCCUGCACGAGCUGUGUGCUGCCAGAGUGUCAGAGGU +>U2AF2_K562_rep02_4937 +UCUCAUAUUUCUAAUCCUCAGGGGUGGCACACACUCUGCAAGCAUGGUGCUAGGCACACGG +>U2AF2_K562_rep02_4941 +UAAAAUGUUUAAUUCCCUUGCUAGCUUGUGAGAAGAAUGAGUUGAUGACAUGCUCCAUACC +>U2AF2_K562_rep02_4942 +UUUUUAACAUAGGCAUACUGCAACCCAUGGGUUGUGUUCCCCAAGUGAAGAUUCUGUGUCU +>U2AF2_K562_rep02_4951 +UUUAUCUUUUUUGGUCCUCUGCCAGCGAACACUUGCCAAGUAUUUCAAUCCUUGCUAUGCC +>U2AF2_K562_rep02_4952 +UCCAAGGGGCAGUUGAAAGCACUUUUUUCGGAACACGAGGUAAGCUGACUUGUUCGUUGUG +>U2AF2_K562_rep02_4953 +AUUCCCUUUUUUCACAUGGCUGCCAAGAAGCUCAGGUUUACAUUUUUUCUCUGUGACUAAG +>U2AF2_K562_rep02_4954 +UUUUGUCCUCAGAAAAGGAAAUCCUCGCUUCCAUGGCUGCCAAAAGGACAGUGUUUCUGGC +>U2AF2_K562_rep02_4965 +GUCUUCAUUUACUAUAUUAUGUAGGGUUUCUGUCCAACAAGAGUACUUGUAUAUCUUUGCU +>U2AF2_K562_rep02_4966 +GCCCCUUUCUUCUGUCCCCAGGGCCUCGGCUUCACAGGAUGGGGCUGCCAGUGUCCUGGGC +>U2AF2_K562_rep02_4967 
+GCCCCUUUCUUCUGUCCCCAGGGCCUCGGCUUCACAGGAUGGGGCUGCCAGUGUCCUGGGC +>U2AF2_K562_rep02_4973 +CCUAAUGUGUUUUUUCUUCCUUCCUUACCAGAUGAAAUUAAAGCAGAAAUAGAAAAGCAGA +>U2AF2_K562_rep02_4974 +GCUUCGCUAUUCUUGCAGGUGGAUGGGCAGGUGGUAGCACUGCUGGUACAGAAUCUGGAGC +>U2AF2_K562_rep02_4975 +UGUGUGACUUCGUCCCUUAGGAGCUCAGCCUGAGGAAGAAAGGCCUGGAGUGCCUCGUGUC +>U2AF2_K562_rep02_4976 +GUCCCCCCUUUCCUGUGGCAGGGCCGGAUCGUGGCACCCAGAGGCUGCCAGGACUUUGGCU +>U2AF2_K562_rep02_6000 +UUCCAUUGUUUUUUUUAGAUUCUCUCGGGCCUAGCCGUCCUUGGAACCCGAUAUUCGGGCU +>U2AF2_K562_rep02_6001 +CUCGGGCCUAGCCGUCCUUGGAACCCGAUAUUCGGGCUGGGCGGUUCCGCGGCCUGGGCCU +>U2AF2_K562_rep02_6002 +CCGCGGCCUGGGCCUAGGGGCUUAACAGUAGCAACAGAAGCGGCGGCGGCGGCAGCAGCAG +>U2AF2_K562_rep02_6003 +CCGUCCUUGGAACCCGAUAUUCGGGCUGGGCGGUUCCGCGGCCUGGGCCUAGGGGCUUAAC +>U2AF2_K562_rep02_6004 +UAUUCCUGUUCCCUUUACCCUUUGACAACUUGAAAUGUUACCACUUCGUCCUCAUGAUGUU +>U2AF2_K562_rep02_6005 +UUCAGCUUUAGCUGCAGCUGCCUCUGUUCAGCCACUUGCAACACAAUGUUUCCAACUCUCU +>U2AF2_K562_rep02_6006 +UAGCACCCCAGAUACUCGCCCAGCUGGUCUGGAAGAGGCUGAUCAGCCACCGUUGCCUGGA +>U2AF2_K562_rep02_6007 +GUUCCUCCCUCUUUUUUCCUAUGAAAGUUGACUAUAUAAUUAUUAAGCCAUUACCAGGAUA +>U2AF2_K562_rep02_6008 +CCCCCUUCUUGAGUGUUCCCCAUCGGUUUGUCCCCAGGGCUGCGCUGGCCUCGGCACACCA +>U2AF2_K562_rep02_6009 +CAUCGGUUUGUCCCCAGGGCUGCGCUGGCCUCGGCACACCAGUGCCACCCGCUGCCCCGGA +>U2AF2_K562_rep02_6010 +CCUUUUCUUGGCAGGCCCCUCGGGAGGCAUUGGCACAGACCGUGCUCGCAGAAGUGCCCAC +>U2AF2_K562_rep02_6011 +UUUUCUUCCCCCACAGUUCAUCCAUGAGCUCGGAUUUCCCACAUUACAACUUCAGGAUGCC +>U2AF2_K562_rep02_6012 +UCUCUUCUUCCCUUCUUUCUGGUUGGUGCUGCUGGGCCAGGUGGGAAUUUCUGAUUAAAUC +>U2AF2_K562_rep02_6013 +UCUAAUGCACUGUUUUAUCCUUAGCUUUGUUUGUUAUUAUGUUUUGGAAUGAAAUUUGGUC +>U2AF2_K562_rep02_6014 +UCUAGAAAGCGAAAUUAUUAUUGACGAUGGACAAUUUGGAAUCCACAGUAAGUGAGACUGA +>U2AF2_K562_rep02_6015 +UUUCUUUUAGGAGCUUACUCCACGGGAACAGCCUCUAGAUAAUCUGAGUUGUUGAAAAUAC +>U2AF2_K562_rep02_6016 +UGCGCUGGCCUCGGCACACCAGUGCCACCCGCUGCCCCGGACGCUGAGCGUCCUGAAGAGC +>U2AF2_K562_rep02_6017 +CCAUCACCCGCCUCUGUUUUCUCCCCAAGCUGAGGCAACUUCUCCUAGAAUCUCAAUCUCA 
+>U2AF2_K562_rep02_6018 +AGGCUAACUCCUUUCUGACCCGUUCAUCCCACAGGCCCUGGAUUAUUGUCACAGCAUGGGA +>U2AF2_K562_rep02_6019 +UCAUCCCACAGGCCCUGGAUUAUUGUCACAGCAUGGGAAUUAUGCACAGAGAUGUCAAGCC +>U2AF2_K562_rep02_6021 +UUUGUUUGCCUUGUUGUAGGUGGACCCAAGAGCCAUAUCAGUGCUAGCAAAAUGGCAGAAU +>U2AF2_K562_rep02_6022 +UUUGUUUGCCUUGUUGUAGGUGGACCCAAGAGCCAUAUCAGUGCUAGCAAAAUGGCAGAAU +>U2AF2_K562_rep02_6024 +CUCUGUUUUCACUCUCAGGCUCUGGUAAGUAUUCGUAUUCUCUUCAUCCCAGUCUGAUUGC +>U2AF2_K562_rep02_6025 +CAAAUCAUCCUACUCCCAAAUAGGCACCCACUCACUACCUUGGCGUCGUUUUUUGGGUCUG +>U2AF2_K562_rep02_6026 +UUUUUCUUCUCAGGAGGAAAAAAAGCAAGAGCAGAAGUCGUAGUCAUGAACGAAAGAGAAG +>U2AF2_K562_rep02_6027 +CUUCCCUGUUACCCCCAGAGCAGAUGCCCUCAUGUGUUCUGCGUAGAUCCCCAGCUGAGAA +>U2AF2_K562_rep02_6028 +AGCUUUCCUUCCAGGUGGGAGCAGCCUGCAUCCUGGAACUGCCAUCCCAGGGUAGGUCUGC +>U2AF2_K562_rep02_6033 +GUAUUUUAUUUUGCUAGGUGAGGCCCUGGUGACCACGUGAGAAAUGAUACCUGUCUAACCA +>U2AF2_K562_rep02_6035 +UUCUAUUUUUUUUUUCCCCCAAGCAGAGACCUAGAUGAAAUCGAAUUACCAAGCAUUCUUU +>U2AF2_K562_rep02_6037 +ACUAAAUUUUCUAUUUUCCUUAAAUUCUAGAAAGCGAAAUUAUUAUUGACGAUGGACAAUU +>U2AF2_K562_rep02_6039 +UCUCUAGCCCUAACCGGCAGCCAUUUGUUCUCUUUGGUAAUCACUCCACACGAGAAAACCU +>U2AF2_K562_rep02_6040 +ACUUCCUGGGACCUGGAGUGGGCCUCCUGACCUGGGGCUCGCUGGGAAGGGAGGGUUCCCC +>U2AF2_K562_rep02_6046 +AGUCAUCCCACAGGCCUCGCGGACGAAGGGGUGCCUGAAGCUGUGGAGAGGGUGCACAGGG +>U2AF2_K562_rep02_6047 +CUGAUUGCAUAGCCACACUGCCCGGCACGCCACAUCCACCCCUGUCUGCACAUGAGUUGUU +>U2AF2_K562_rep02_6049 +UUGUUUUCUUAAUUCCAGACUUUCUGUUCCAGAUCUCACUCCAAACAUUGGUCUUUUCUGG +>U2AF2_K562_rep02_6052 +ACUUCAGCAUUCCUUGAAGAAAAGAGGAACCCGCUCCCUGGGGAAGGCCGAUAAGAAGACU +>U2AF2_K562_rep02_6053 +UGUUUUUGUUCUUUUCCCCUAGUCACGAACCCCCGCCUUGGUUUUUGAACACGUAAACAAC +>U2AF2_K562_rep02_6054 +CAGGCUUAUCCCGUCCUGGGGCCCCAGUCCUCGGCCCUGUGAGCCUCACUUCCUCUAGGUC +>U2AF2_K562_rep02_6057 +GUCAUUUUGUUCAUAGGUUUCUAGACCAACUGGGGAGAUUCCCGUUAAAAAGUAUGUAUAC +>U2AF2_K562_rep02_6058 +CUCACAGCUGUCAGCUUCCCCUGGGUCAGGCCAGGGCCUCCUCAUGGCUCUGGGGUGGUUG +>U2AF2_K562_rep02_6059 
+UCCCUCCUUCCUUCAUCAGUGUCCCCCAGAGCUCUGGACCUAACAGGUACUCAAUAUGUGC +>U2AF2_K562_rep02_6060 +UUUUCUUUUUACAGGAACGGCAGAGUCGAAACAAACAAUGAGGGCGAACCAGUUUCUUACA +>U2AF2_K562_rep02_6063 +UUUAACUCGUUCAGCAAAGCCUGUGCGGAGCGAGCCAGAGCUACCUGUGGAAGGGACCUCA +>U2AF2_K562_rep02_6064 +CCUCUGCCCUUCCUACACUGUCAAACUAGGUUUACCAUCUGAUUUUCAUACUGCUGACUUU +>U2AF2_K562_rep02_6067 +CCUUCUGUGCUGCCUCCCACCAGGUGCACCCCAGACAUGGAUGUCAUCCUCAACAUUCCUG +>U2AF2_K562_rep02_6074 +CUGUCAGUUUUCUCCCAUGAUCAGGGCUGAGCAGUACCAGUUCCGAAGGAAACAUCAUAGG +>U2AF2_K562_rep02_6075 +UAAUACUUUCUUACAGAGAAGAAGAAGUUGGAUGGGAUACCGAGAUUAAGGAUGAUGUGAU +>U2AF2_K562_rep02_6076 +GGAGAACAUGCCUGUAUUAAGGGCCGAGGUGGAAGAGCUCCAAGCCCAGACCCGGGAACCC +>U2AF2_K562_rep02_6080 +CUGCUUUCUCCCCUAUCCCCUGUCUCUACCCCCAGGCACAUGGCCACCCACUCAGCCCAGA +>U2AF2_K562_rep02_6081 +GGGUGUCUUCCAACCUUUUCUUUGUAGAACACAACUUUCCUGAACAGGAAAUCCAAGAGGG +>U2AF2_K562_rep02_6082 +UUUAUUUUGUGACUACGCCACAUGCUGGGUUUUCUUUUUGAAUUUAGGCAUAAAUGAAAUC +>U2AF2_K562_rep02_6085 +UUUUUCUGACAUCCAGGUAGCCCAGUGUGUCUCACCAAAGGGACCUCUUGCUUGUUCGAGA +>U2AF2_K562_rep02_6087 +UUAUACAAGCAAGAGCAACAGCUCUAUAUCUGGAUCACUGCAGUGCCUAGAAGAUACAACA +>U2AF2_K562_rep02_6090 +GACUCUUCUUCUUCCCAGGCUCAGGCCCGAUGUCACCGCAUAGGCCAGAGCAAAGCUGUGA +>U2AF2_K562_rep02_6098 +CUCCUCCCUUCACUUCACCAGGGGCGACCUGACGGAAGAUAACAUGGAGACAGAAAAUGCA +>U2AF2_K562_rep02_6099 +AUUUUGCUUUCUCUUUCACUAGGAUGGAAUGUGGGAUGGUAACUUAUCAACAUAUUUUGAC +>U2AF2_K562_rep02_6105 +UGCAGGUUAUUGAGGUGGUGAUCCGCUCAGAAGAGGGGCUCUCAAGGGACAUGGUGAAACA +>U2AF2_K562_rep02_6106 +UCUUGUUUUUUUUUCCGUUUGACAGAAACUGAUAAAGCUGACUUGAGUGGUAUUUAAAUAU +>U2AF2_K562_rep02_6107 +UUUUUUUUCCUUGCCUUAGCCCCGUCGCAGAAUUUAGUCUCAAAGGAAACUUCAACCACAG +>U2AF2_K562_rep02_6108 +CGCUCAACUGUUGGCCCCACAGGGACAAGGAGACCAGUCGCGACGAGUUCAUCUUCUACUC +>U2AF2_K562_rep02_6109 +AGCCCCAGGAAGCCUUGGUCGGGGGCAGGAGGGAGGGUCAGGCAGGGCUGGGGGCCUGAC +>U2AF2_K562_rep02_6110 +CAGCCCCAGGAAGCCUUGGUCGGGGGCAGGAGGGAGGGUCAGGCAGGGCUGGGGGCCUGAC +>U2AF2_K562_rep02_6117 +CCCUGAUUUUUCUGUACCUUGGCUACCACAGGUUCUGCUGAAUGUCCUGACCUUGAACCGG +>U2AF2_K562_rep02_6118 
+AUGUUUUUGCCCUCUGUUGCAGUUGCAGGAUGUGAGUUUGAAUCUAUGGAAUGUCUACAGC +>U2AF2_K562_rep02_6119 +CUUUUAGGACUUGGCAGCAUUAGGCUGGUGCUCAGACGAAGAGGAGAAGAUCUUCAGGAAG +>U2AF2_K562_rep02_6120 +UUUAAACUCUCCUUAUCUUCCCCCCCACUUUCUUCCUCACAAAAAGAAUCUUACAGCUGCU +>U2AF2_K562_rep02_6879 +UCUCCUUCUUUCUUCCAGGGGCCGGGCUAGAGCGACAUCAUGGUAUUCCCCUUACUAAAAA +>U2AF2_K562_rep02_6880 +UCUCCUUCUUUCUUCCAGGGGCCGGGCUAGAGCGACAUCAUGGUAUUCCCCUUACUAAAAA +>U2AF2_K562_rep02_6881 +GGCCCAGGGAGUGGGGCAGGGGGCUGCUUAUUCACUCUGGGGAUUCGCCAUGGACACGUCU +>U2AF2_K562_rep02_6882 +AACUGCUGAGGAGGGACCUGCUUUGGGGAGUAGGGGAAGGCCCAGGGAGUGGGGCAGGGGG +>U2AF2_K562_rep02_6883 +CUUUGCAGGUUUCUGUAGCCGGAAGAUCUCCGUUCCGCUCCCAGCGGCUCCAGUGUAAAUU +>U2AF2_K562_rep02_6886 +GGAAGGGGGGAGAAUCCCAUAACUAACUGCUGAGGAGGGACCUGCUUUGGGGAGUAGGGGA +>U2AF2_K562_rep02_6887 +CAACAGGCCACAACAUCUAUUCCAAUAUAUUAGGUUUCCUCGGUGGUGUUUCCUGGGCUAU +>U2AF2_K562_rep02_6888 +UCUUGGCCUCAGGCUCCUGUUCUGGAUGUCAGAUAUGCAUCUGCCUCCUGAGAAACUGGUG +>U2AF2_K562_rep02_6889 +UUUUCUUUCAGAGCUGUUGCGCAGCCAUUGGUACCUGUAUUGGGGAAACAUAGCAUACAAG +>U2AF2_K562_rep02_6890 +CUGCAUAUUUUCCCCUUUUGUGAACAGGUACUGGUGGAGAAUGGAACAAAAGCUGGGCACA +>U2AF2_K562_rep02_6891 +UUUUUUUUUCCCCUCAGGUGGCGACAUGUCUAAGAAUGUGAGCCAGUCACAGAUGGCAAAA +>U2AF2_K562_rep02_6892 +GUCAAGAAGCAGGUCUCGAUCCCGGACCAGAAGUUCCUCUAGGUCUCGUAGCCGAUCCCGU +>U2AF2_K562_rep02_6893 +UUUUUUCCUCUCUUUUGACCUCCCCAGACCGAGUGACGGUUCUCUACAGGAGCAAAGCCAU +>U2AF2_K562_rep02_6894 +CAGCGGCUCCAGUGUAAAUUCCCCUUCCCCCUGGGGAAAUGCACUACCUUGUUUUGGGGGG +>U2AF2_K562_rep02_6895 +CAGCUACCAUUCAUUUCCUGAUUUCAUUUAUAGGUCUUACCAGGCAAGAAGGCCAAGCAGA +>U2AF2_K562_rep02_6896 +UGAUGUUAAACCUGGGGGGAUUUUUGUGUGUUCUUUCCCUUUUUCUUUCAGAGCUGUUGCG +>U2AF2_K562_rep02_6897 +GCCUUUUUUCCCUUUUAUUUGGAGGGAAUGGGAGGAAGUGGGAACAGGGAGGUGGGAGGUG +>U2AF2_K562_rep02_6898 +CCUUCACAGUAACUGGGGCAGGGGCCUACGGGGAGGGGCUUGUACUGAACUAUCUAGUGAU +>U2AF2_K562_rep02_6899 +CCUUCACAGUAACUGGGGCAGGGGCCUACGGGGAGGGGCUUGUACUGAACUAUCUAGUGAU +>U2AF2_K562_rep02_6900 +UUCUCCCAAGCCAAACUGGCAAGACGCAGUCAAGAACGGGACAAUCUUGGCAUGUUGGUCU 
+>U2AF2_K562_rep02_6901 +UUUUAAAAAAAAGAUAUACUGUGGAAGGGGGGAGAAUCCCAUAACUAACUGCUGAGGAGGG +>U2AF2_K562_rep02_6902 +AUUUGGAGGGAAUGGGAGGAAGUGGGAACAGGGAGGUGGGAGGUGGAUUUUGUUUAUUUUU +>U2AF2_K562_rep02_6903 +UUCUCUUAGCUGGAUGCUAGUGAUUCCAGUUCUAGCAGCAAUCUUUCACUUGCUAAGGUUA +>U2AF2_K562_rep02_6904 +CUCCUCCUUCAUCCUUAGUUCCAAACUGCUUAUCACUUCCCUGUUCCAUAGGCCACUUAGG +>U2AF2_K562_rep02_6905 +ACAAAAGCUGGGCACAGCCUUCUCAUGGAUGCCAGGGAUCUGGUCCUUAAGGUAAGGCUUC +>U2AF2_K562_rep02_6906 +UUCUUUAAUUAGGCUCACGAGGCCCAGGGAAUCCUCUGGACCAUCAGAUUACCAAUGAAAG +>U2AF2_K562_rep02_6907 +UUCUUUAAUUAGGCUCACGAGGCCCAGGGAAUCCUCUGGACCAUCAGAUUACCAAUGAAAG +>U2AF2_K562_rep02_6908 +ACCUCUUUUCCCCUAUGCAGCAGGAACUCCAGAAGAUAAAAUGAGGUUGUUUCUUAUCUAU +>U2AF2_K562_rep02_6909 +UUUUUUUUUUUAACCAGCAGGAGAGCAAAGGGAGAAAGCUCUAGGCUAAAGGCCAGAAGAC +>U2AF2_K562_rep02_6910 +UCUUCUUAGGUUUAUCGGCGGGGGCUUCAGGCAAUACCUCUUAGUGUUGACCUUUGGAUAC +>U2AF2_K562_rep02_6911 +UCCUUCUCCAUGGACGGUGCGGAGGCCUGGGCCAGGGCUGACUCCCUUCAGGAGUGGAGGC +>U2AF2_K562_rep02_6912 +UUCCACCCCACUUCUUUUGGCAGCUAGGUGCUGAGACAGGUGUGCAAAGUUCUGACCUUCA +>U2AF2_K562_rep02_6913 +CAGACCGAGUGACGGUUCUCUACAGGAGCAAAGCCAUUCGCUAUACCUGGCCUUGUCCAUU +>U2AF2_K562_rep02_6914 +GAGACUGAUGUUGACACACUUUUUUUCCAUUUGGCAGGAAUGGGAGUACAGUGCCAUUAGG +>U2AF2_K562_rep02_6915 +CAUUUGGCAGGAAUGGGAGUACAGUGCCAUUAGGACCAGCAAGUGACACAGGAAUUCUGAA +>U2AF2_K562_rep02_6916 +UCUUUUUUUAGGAAAAUGUCUGAUGAAUUUUCGGUAAGUUGAUCAGUUUAUCUGUGAUAAG +>U2AF2_K562_rep02_6917 +AAACUUCCUUUUGGCAGAUGUGGCCUCAUGGAUGAGCUGGUACACGACUUAGCCUCAGCCU +>U2AF2_K562_rep02_6918 +CCCUUUUCUUCCUUCAGCAGAGGCCAGGCUAUGGAGCAGGGCCACUGAAUUUGCUGUAAUC +>U2AF2_K562_rep02_6920 +AGUUAUGUUUCACUCUAGGGAACAAGUCCUGAAGAACCCUCAAGCCCUAAAGUACCACCUC +>U2AF2_K562_rep02_6921 +GUAAAAAAUUAUUUUUUCCUGAUAGCUGGCCCGGUGAUCAUGUCCAUUGAGGAGAAGAUGG +>U2AF2_K562_rep02_6922 +GUAAAAAAUUAUUUUUUCCUGAUAGCUGGCCCGGUGAUCAUGUCCAUUGAGGAGAAGAUGG +>U2AF2_K562_rep02_6923 +AUUCUCUCUUUCCCCUUAUUUCAGGUCAGAAGAGGCCAAGUGAUGGAAAUAGUGGAUUAAU +>U2AF2_K562_rep02_6924 
+UUUGCCUUCUAGGAUUCUUACAGAAGCAGAGAUUGAUGCUCACCUUGUUGCUCUAGCAGAG +>U2AF2_K562_rep02_6925 +UUUGCCUUCUAGGAUUCUUACAGAAGCAGAGAUUGAUGCUCACCUUGUUGCUCUAGCAGAG +>U2AF2_K562_rep02_6926 +UUUUUCUUCCGUGUCCUCUCCUCUCCCGCAGUGAAGUUAUUCGAAGUCAUUGAAACUGAAA +>U2AF2_K562_rep02_6927 +ACGUUUUUUUCAGGAUGGCACUGGAUCUUUAAAACGCAGUGGUUCCUUUAGCAAACUCCGG +>U2AF2_K562_rep02_6929 +ACUCCCCCUUUCUUCCAUCCCUCAUCCAUUCCUUUAGGUAACUACUAUCCUGAAGUUGAGA +>U2AF2_K562_rep02_6930 +UUUUCACCCUUCCUGUGUUCUUGGUGGGGUUUCCCCGACCUAUUCAGAGUUGGCCAGGAGC +>U2AF2_K562_rep02_6933 +CUCUUUGUUGGCAGGUGCGUUAAACCUCUACAGUUUGUCAAGCUUUGCAGUGCAAGCCUCU +>U2AF2_K562_rep02_6934 +UUUUGUCUUGAUGUUUUCCCUCUAGGCUGAAAAUCUAUUGUUAGAUGCCGAUAUGAACAUU +>U2AF2_K562_rep02_6936 +UCCUUCUAUUUCUGCCCUAUUUUUUUCCAGGAAGAAAAAAUGCUGGGCAUCUUGGUGCAGC +>U2AF2_K562_rep02_6939 +CACAGUGUCCCCAUGAACUCCCUUGUCCCCAGUUGACCAACCUGGCCUGUAGCUUCUCACA +>U2AF2_K562_rep02_6940 +CUUAGAAUGGUCCUUCUCUUUUGCCCCUACCUAGUCUUUUAUCACGAGUCAUGAAUACAGG +>U2AF2_K562_rep02_6942 +UGCCCCUACCUAGUCUUUUAUCACGAGUCAUGAAUACAGGAUCACAGUUUGUGAUGGAAGG +>U2AF2_K562_rep02_6945 +GCACUUUGUACUUAGAAUGGUCCUUCUCUUUUGCCCCUACCUAGUCUUUUAUCACGAGUCA +>U2AF2_K562_rep02_6955 +GUCAUGUUCCUUGUCUUGGUCCUCAGGUGCAGUUUGAUGUAGUAGUGUCAGCUUUUUCCUU +>U2AF2_K562_rep02_6960 +UAUUUUCUAUGACAGGCUGGGCGGGGAGCGUCGGACCAGAAGAGAAUCACGCCAGGAAAGC +>U2AF2_K562_rep02_6961 +UUUGCCAUCUUAGGGCUGCUCACAGUAUUUGGGGCCAGAGCCUACGUGAAUAUAUGUGUGU +>U2AF2_K562_rep02_6962 +AUUUAUUUCUAUUUUUAGUGGGAAGAUCCUGGCUGUAAGGAUGAAUAAUGUUAAGUUUAAA +>U2AF2_K562_rep02_6963 +UAUUUUAAUUUUAGGUUCUAUUUUGUGGGUGAUGAAGAUUUGCUUGAAAUCAUUGGAAACA +>U2AF2_K562_rep02_6964 +UUCUUUUUAGGACUCCUUCUCCCUCUAUGAUUGCUCUUACACAGCUACUGACAUUUAUACU +>U2AF2_K562_rep02_6966 +UCUUUUCCCCCUUCCCCAUCCUCUUUGUCUCACAGGAACAACUUGAUACAGAGACAAGUAC +>U2AF2_K562_rep02_6967 +UCUUAAGUUUUAAGCAGGGUCUGAAAACCCUUGGUGUUUUGGAGAAAAUUCAGGCUUAUCC +>U2AF2_K562_rep02_6968 +UACGGCUCUGUGUUUGUCCCUCAGACAAGUUGGAUGGCUUGAGGACUGGUACUAAAAGGAA +>U2AF2_K562_rep02_6969 +UUUUCUUCAGCUCCCAUUGCUAUCACAUGUUUUACCAGAGGCUUGGACAUCAGGAAAGAGA 
+>U2AF2_K562_rep02_6970 +UUCCAUUUAAACAGGGUUAAUUUGGAAGAAUCUUCAGGAGUGGAAAACUCUCCAGCUGGUG +>U2AF2_K562_rep02_6971 +UCCUGUUAUUCUCUCCCUCUCUUUAGUUUCUGGUUACCAUCAGCUGGGAAAAGAGAACGAA +>U2AF2_K562_rep02_6978 +UCUCUCCUUCCCUCCUGUGAACGUCUGUGUCAGGCAGUGUGUUAGUCACUGAGGUUUUGCU +>U2AF2_K562_rep02_6986 +UUUUAAGGUAUGAUGAGUGGGUGAAGGCUGACAGGAUAAUCUGGCCUUUGGACAAAGGUGG +>U2AF2_K562_rep02_6987 +UAACUGACCUUGUCUACAGAACUAGACAGUACGGAUGGUGCCAAAGUUUUUAGUAAACAAC +>U2AF2_K562_rep02_6988 +UCUUAUUUCCACAGGCAUUCGUUUUGCUCAUCUUUGGAAUUUUGGUUGGGAAUUUUAGUUU +>U2AF2_K562_rep02_6989 +AAUCUCUUUGUACCUGCAGGCCGCAUUGACAGGAAGAUUGAGUUCCCCCUGCCUGAUGAAA +>U2AF2_K562_rep02_7000 +UUCAUAUUUGUCUUCAGUUACAGGUUUAUGAUAAUGGAUCGCUUUGGGAGUGACCUUCAGA +>U2AF2_K562_rep02_7001 +CUGUUUGUCUUUCCAGGCUUGUUUUGCAGAGGGAGAAGCACUUCCAUUAUCUGAAAAGAGG +>U2AF2_K562_rep02_7002 +CUGUUUGUCUUUCCAGGCUUGUUUUGCAGAGGGAGAAGCACUUCCAUUAUCUGAAAAGAGG +>U2AF2_K562_rep02_7003 +UUUCCAGGUGGUUCGCUUUGAGGUGGUCUGAAGCCAAGGCCUCGCGGAGCUUCUUUGUGUG +>U2AF2_K562_rep02_7004 +UGAUUUCUUGCCCGUCCCCUCCCUCCUUCCUGCUGCGACUGUGGGACUGUGGCCCAGGUGU +>U2AF2_K562_rep02_7005 +ACUGUUAUUUUACAGGCUUUCUUGGCUACACAAGUAGUUUAUCAUUUUUCUUUAUGAUGUU +>U2AF2_K562_rep02_7008 +CCACUCCCAUCUUGCAGGUGCAGGAGCUCCAGUCUCUAGGCUUUGGGCCUGAGGAGGGGUC +>U2AF2_K562_rep02_7009 +CACUCCCAUCUUGCAGGUGCAGGAGCUCCAGUCUCUAGGCUUUGGGCCUGAGGAGGGGUCU +>U2AF2_K562_rep02_7010 +UUAGGUCUUGCUAUCACAGAUGAAAUUUUGCUGAGUAAGGCAGAGUGGUCCAAACUUUUUG +>U2AF2_K562_rep02_7011 +CUUUCUCCCCAGGAACGACUGAAGCUGGUGACUGUUUUGGGUGCUGGCCUUCUCUGUGGAA +>U2AF2_K562_rep02_7012 +UUUUUUUUUUUUAGAUUACAGGUCCACCAGGUUGUGGAAAAACUCAGUUUUGUAUAAUGAU +>U2AF2_K562_rep02_7013 +CUUUUCUUUGCAGAAAAAGAAAGAAGAGGGUGUUAUUGAUUCAUCUGACAAAGAAAUCGUU +>U2AF2_K562_rep02_7014 +GUAGCUCUGUUUUCAUAAACAGGAAGAAGAGGAGGAUGAUGACUGGGGAGAAGAUACAACU +>U2AF2_K562_rep02_7015 +UCCAUAACAUUCCCUUUUUAGCCUCAAGAACUUGCUGCUUUUUCUGGAAGAAAUAAUUCAU +>U2AF2_K562_rep02_7016 +UCUUAUGUUUUCCUUCCCAGGAGUGGACCUACCCUAUGAGACGAGAGAUGCAGGUAUGGCA +>U2AF2_K562_rep02_7017 
+UACUUUUUCACUGUUAGCUUGUGUUUUCUGUCGAAAACAUGAUGACUGUCCUAAUAAAUAC +>U2AF2_K562_rep02_7018 +GCCAAUUUGCUUUAUCCUUCUCUUCAUAGGUUUCUUCUGAAAUGUUUUGCUAGUAAGUUGC +>U2AF2_K562_rep02_7019 +AUUCUCCCACCCCCCAAACGUUUUCUGCUUUUUUUAGCUCAGCCUCUUUAACCUUGAUGGA +>U2AF2_K562_rep02_7020 +UUUUUGUUUUUUUUUAUGAUGUGGGUUAGGGAUAGAACUUCAUUUUCUUUUAAAUUUAUUU +>U2AF2_K562_rep02_8478 +CCCCUUUUUCUUCUUCAUACAGAGCUCGCUGCCCAAAUCAUUCAAGAGGAAGAUCUCCGUU +>U2AF2_K562_rep02_8479 +CGCUGCCCAAAUCAUUCAAGAGGAAGAUCUCCGUUGUCUGUAAGUCCAGCCCCAAAUCCCU +>U2AF2_K562_rep02_8481 +UUUUUUAGGUACCAGCAUCAAGAUGAUUUAUGGUAAUAAGGUACUCAGUCUUUGCUUAAAA +>U2AF2_K562_rep02_8482 +UUUUUUUAGGUACCAGCAUCAAGAUGAUUUAUGGUAAUAAGGUACUCAGUCUUUGCUUAAA +>U2AF2_K562_rep02_8483 +CCUUUCAUUUUCUACGACCGCGAGGACUACGGGAUCAUGAAAAUGAAGAUCGUGAUGCUCA +>U2AF2_K562_rep02_8484 +UGCUAGAUUUCUAACGACCCAAGUCCAGGAUACAACAUUGAACAGAUGGCAAAGCGGUAAG +>U2AF2_K562_rep02_8486 +UUCAAGAGGAAGAUCUCCGUUGUCUGUAAGUCCAGCCCCAAAUCCCUGAUAAAAGUCAGGA +>U2AF2_K562_rep02_8487 +UGUGGGGUGUCUCUCUUUCUCUUUUUUUUCCCCUUUUUCUUCUUCAUACAGAGCUCGCUGC +>U2AF2_K562_rep02_8488 +UCUAGCAUUUGCUUUCCCUUCUAGGUCUCCUUAACAGCAGCAGCAGUGUUUUAAGGUAGAU +>U2AF2_K562_rep02_8489 +AUCUUUAUUCCCUUCUUUCCUCUUCCAGCUGAGCAGAGUUGGAUAAUUGAAUUAGUCAUUC +>U2AF2_K562_rep02_8490 +GCCUUUUUCUGGUGUGUGUUGCGGGGGUGGGGGCCGGUGAAAGUGAUUUGAUGUGCAGAAU +>U2AF2_K562_rep02_8491 +UAUAAUCCCUUUAGUCCUCUUUUUUUCAGUUUUUAUGAAGAACAGUUUGUCAGCAUCUUCA +>U2AF2_K562_rep02_8492 +UCUUCCCAUUCUCUUUCUAGGAUCUUCUGAGGUCGGAGCUUCCAGAUUCAAUUGAAAGUGC +>U2AF2_K562_rep02_8493 +UUUUUUCCUUCGCACAGGUCCUCUGGUGAUGUUCUUGAGACGUUCAAUUUCUUAGAAAAUG +>U2AF2_K562_rep02_8494 +UCCUUCUUCCCCGUAAAACUUUGUCCAAGUACCUCAUGUACGGUAAUCCGCCCGUAAAAUA +>U2AF2_K562_rep02_8495 +CUUCCAUUCCCUCCUUCCUUAUUUUUUUCUUCUGCUAGAUUUCUAACGACCCAAGUCCAGG +>U2AF2_K562_rep02_8496 +UUCUGCUUUUCUUAUCAGCACUGUUCUGCAGGCAAAGUCAUGGCAAUUUCCUUAAAGUUAU +>U2AF2_K562_rep02_8497 +AGACCAUGGUUGGUCUGCUUCCCUCACUCGGGCUCCUUGACAGUCUUCUAGAAGAGAGAAG +>U2AF2_K562_rep02_8499 +AACCCAACCUCAGGUCCAGAUACUUCGUCUGCUUCGGAUCCUGGGCCGGAACCACGAGGAG 
+>U2AF2_K562_rep02_8501 +CUAUUGGGGCGGGUGGGCAGGAAUGGACCUAGGGGAAAGAGUAGAGCACUCUAGUGAUCCC +>U2AF2_K562_rep02_8503 +UUUUCCCCCACCAUUAGAUAUUGAAAAAGUACUUGUUUCUCUGCAGAAAGCAGAAGACUAU +>U2AF2_K562_rep02_8504 +UUUUUCCUCUCUUCCUACAAUAGCGGCCCUGUUCUGUCAUUAGCUAUUAGUUCUAAUGGAG +>U2AF2_K562_rep02_8505 +GUUUUCUUCUUUUUCCUCUUCCUCUCCCUCCCUUUUUUCUAAAAAAUUAUAGCUAAAGCCU +>U2AF2_K562_rep02_8507 +UUAUCUUCUAUUCCCUCCUCCUAGGGUCAUCACACUGAAACGGUGUUCAACCGGGUUUUGC +>U2AF2_K562_rep02_8510 +CUUUCUUUUCCUCCAUCCUGCCCCUUUUCUUCAGUAUUUCAUAGCCUUAAUUGAACAAGUU +>U2AF2_K562_rep02_8511 +CUUUCUUUUCCUCCAUCCUGCCCCUUUUCUUCAGUAUUUCAUAGCCUUAAUUGAACAAGUU +>U2AF2_K562_rep02_8512 +CCAUAGUGGACAGAGUUCACAGACCGCACUUUGGCACGUUGUCCUCACUGCAGGAAAGUGU +>U2AF2_K562_rep02_8513 +CUCUCUUAUUCCAGGAAGAGCAACCGAGGUUUCAAUCUGCGGUACGUCUCCUACUCUCCAU +>U2AF2_K562_rep02_8514 +UUUAUUUUUCCUCCCAACUUUUACUUUAGGUUCAGAAGGUAUGUGUGCAGAUUUGUUUCAU +>U2AF2_K562_rep02_8515 +UGUUUUCAGCUGCCCUAUGAUGACUGUGUGUUUGGAGGCCAGCGUCUGACGUUAUGAGCGC +>U2AF2_K562_rep02_8516 +UAUUUGAUUCUUUGACAGGCCAGCCACAUCCUGAAGAUGUACUACUGUUUGCCAUUCCAAU +>U2AF2_K562_rep02_8517 +AAAAAAUUAUAGCUAAAGCCUGGAGAAAAGCCUGUUCCAGGUAUGGUUCAUGUAAUAUUCU +>U2AF2_K562_rep02_8518 +UGGCCUCACACACCUCUGUUCCCCUCCUAGGACCAAGGGACCUGUGGAGGUGAGGAGGUGG +>U2AF2_K562_rep02_8519 +UGCCUUGCUUAAUCCCAGGAACCUGGCCACUGCUCCUUGGUCCUUGGCAUUAUGACGGGAU +>U2AF2_K562_rep02_8520 +AUUUUUCUUUUGAUUUCAGAGAACACUUUUUACAGUUGGCUAGAAGGUAAUUAGAAACUUU +>U2AF2_K562_rep02_8525 +CUUCUUCAUUCAUGUUCAUCUCUGCUAUUCCUUCUCCCUCCAGAAGGGAUGGAAACCCUAU +>U2AF2_K562_rep02_8533 +UUUAGCUUCUCCUCUUAUGGGUGCUCAGAGUUUCCCUAAUUUGACCACACCUGGUACUACA +>U2AF2_K562_rep02_8534 +AUUUUUUCCCUUCCCCUCCUAAAACAUCUCUAAAGCAGAAAAACUCAAUAUUGAUCAGGUG +>U2AF2_K562_rep02_8537 +GUUUGUUUUUUCCCCAGAGCCAAAUGUUCUAGCUGGCACUUUAGUUGGUCAUACAGAUGCA +>U2AF2_K562_rep02_8538 +UUUCUGUUACUUCCCCCCAGGAGCGAAUCCGUUUAGCUCGACAGAUUGAGAAAUCUGAGUA +>U2AF2_K562_rep02_8539 +UCUUUUAUAGCUUCAGCCCACUUGGGGAGAGUUCCUUGAUCAUCAUAAAGAACAGCCAGUA +>U2AF2_K562_rep02_8541 
+UUUGUCGUUAAGGGUGAUCUGCCAGAUUGCGAAGCUGACCAACUCCUGCAGAUGAUUAGGG +>U2AF2_K562_rep02_8545 +UGUUCUUUUAUUUUGCACUAGGGAGAGGAAAUUCGAUGUCAGUAUGUUGUGACAUGUGCAG +>U2AF2_K562_rep02_8550 +GUCUUUAUAGGAUCUUUAAUGACUUGCUACUGUGGGAACCAACAGCUCCUUCACCAGUGGA +>U2AF2_K562_rep02_8552 +UUUUUUUUUCUUAGACGUUCCAUCCUCAGAGCAGCCUGAACUGUUCCUAAAGAAACUUCAG +>U2AF2_K562_rep02_8558 +UUUCUUUUUUAUAGAGGACCCACAGGCAUGAAUUAUUUACUCCUCCGGUGAUAGGUUCUCA +>U2AF2_K562_rep02_8559 +AACUGUGACUUUGCCUUCAGUGAAGGCCGCCCUCCGUUUGGGAUUUCAUUCUCGUUGUCUU +>U2AF2_K562_rep02_8560 +UUAUGUUUUAGAUGGUGAUGCCAGGAGACCCUGUAGAAAUGACAGAAUUUCAGGAUAAAGC +>U2AF2_K562_rep02_8561 +AACUACUUUGCCUCCCUUCUCUGGUCUGGUGUCGUCCUCACAUAACAUGAGGGCCUGGAGA +>U2AF2_K562_rep02_8562 +CUGCAUGGAAACCUCUUUCUCCUGCCAGGAGAGCCCUGGAACUAAGCCUGGCUCUGGUAAA +>U2AF2_K562_rep02_8563 +UUUUUUUUUCUUGGCAGGGACUCACUCUGUUGCCCAGACUGGAGUGCAGUGGCACAAAGGA +>U2AF2_K562_rep02_8564 +UUGUUUCUUCCCAGUUUUGGAAUUCAAGAACACCUAAGGAUUCCACUGAUUUGCUGAUCUG +>U2AF2_K562_rep02_8565 +CCUACUUUAUAUAAGGGCAACUUCCUGGGAGCUAAGGCUACUAAAAGGUAGAAGCCACAGU +>U2AF2_K562_rep02_8566 +CCUACUUUAUAUAAGGGCAACUUCCUGGGAGCUAAGGCUACUAAAAGGUAGAAGCCACAGU +>U2AF2_K562_rep02_8572 +UCAGCCUUUGAAGUAAAUUUUAUGGAUGAUGUAGGUCAGACUCUAUUAAACUGGGCCUCUG +>U2AF2_K562_rep02_8573 +AGUCACUGCUUUUUCUUAGGUCUCUGUGUAGAAAAAAGAGCAUUCUACAGACUUAUAUCUG +>U2AF2_K562_rep02_8574 +AAUGUCCUUUUUUCGCUCUUCCUGUGUUAACGGCUGCUUUCCUUUCAUUUUCUACGACCGC +>U2AF2_K562_rep02_8575 +UAUUUCCUAGGUUCGUUCCACCAGUCAUAAACCAGAUGAAAUCUAUGGCAUGAUUGAAAGA +>U2AF2_K562_rep02_8579 +CCCCUUCCUCCCAACUUUUUCCGCAUUUCCCCUCCAGUUUCUAUCCUUUUCCCAAGGAAGA +>U2AF2_K562_rep02_8580 +UUCUCAGCCUUUUUUAGCAAAACUUCAGUCUCCGAUUAAAGAGGAGAAUACAACUGCUGUU +>U2AF2_K562_rep02_8581 +UUCCCCUCCCUUGCAAUGUAACCCACAGGCUGAGGAAUUCCUCUACAGAUUCUUGCCACAG +>U2AF2_K562_rep02_8582 +CUAUUUCAGUUGCUAGUGAUAUCUCGCUAACAGGAGGCUCAGUAGUACAGAGAAUACGGCU +>U2AF2_K562_rep02_10076 +CAUUUCUUCGUUUAUCCCCCCAGCAGCGCUGGAGAGCGAGGUGGCUUCAAUAAGCCUGGUG +>U2AF2_K562_rep02_10077 +CUUUAAGGCAGUAUUUUGAUCCCAUAGUAGGUGGAGCAGCCCUGCACACCCCCUCCUGUAU 
+>U2AF2_K562_rep02_10078 +UGAAUGGGCAAGAGGGCACAUGAAGUACGGCGUCCUCCACAUUCACGGCCUCUACACGGAC +>U2AF2_K562_rep02_10079 +UUAGGUGGAUUCUUGCUCUGUCACCCAGGCUGGAGCGUAAUGGCACAAUCUUCGCUCACUU +>U2AF2_K562_rep02_10080 +UUUGCAGGUAGAAGAAGAAAGGUGCCACUCCGGCAUGAAGACAGACUCGCUUAGUCGCCAG +>U2AF2_K562_rep02_10081 +UGUGUUUCUUUUUCUUGGCUUGAUGUUUGGUAGGUCCUUGAAUGGGCAAGAGGGCACAUGA +>U2AF2_K562_rep02_10082 +CCUUUCAUUUCGUUCCCCAGGGCACCGAAGCCAAAGCACUGUCCAUGCCGGAGAAGUGGAA +>U2AF2_K562_rep02_10083 +UUAUUUCUCCUCUUAGACCGCAGGAUGGAAACAAGCCCACUGAGACUAGUCAACCUCAAUC +>U2AF2_K562_rep02_10084 +AUGAUCUUUCCUGGUUGGCAGGACCCAUGGAUGAAGGACCAGAUCUUGAUCUAGGUAAUUU +>U2AF2_K562_rep02_10085 +UCCCUUGAUGACAUGGGGCUGGCUCUGGUUUUCCAGGUGUCCCCUCGUCCCAGCCACCUCC +>U2AF2_K562_rep02_10086 +UCUCUCUCUUUCAGCUAUUCCUCUACACAGCCGACUAGUUAUGAUCAGAGCAGUUACUCUC +>U2AF2_K562_rep02_10087 +UUCCUCCUUCUCCCCUCAGACCGAAGCCAGGACAGCACAGCCGUAGCACUCUCAGACUCUA +>U2AF2_K562_rep02_10088 +UGUCUUCCUGUGCAGGUCGUGGCCGCCCACCUACAGAGCCGCUGCCCGACGGGUGGAUCAU +>U2AF2_K562_rep02_10091 +CAUCCUGUUUGUUUUUCAGAUGAUCAUGCACCCUAAGGGCACAUCUAGGCCCCCUGAGAGC +>U2AF2_K562_rep02_10092 +GUUCACAGAGAUGCUGCAAUUUGUCAGUAAUCAAGUGGGAGAGUUCCCUGACUUGUUUUCA +>U2AF2_K562_rep02_10093 +GGGCACAUCUAGGCCCCCUGAGAGCACCUCCUUUCUGUGUCUGUUCUCAGGAAUGCUGUUG +>U2AF2_K562_rep02_10094 +AGGCCCGAGCAGGUACUGACCCCUUGUCCUUCCCCACAGCCGAGCCCAGGAAGUGCGUCCC +>U2AF2_K562_rep02_10095 +CCUAGCAUCUGUCCUGCCCGAGGUGCUGCCGGUUAGCCAGCGCCCUGUUGUGCCACAGAUU +>U2AF2_K562_rep02_10096 +GUUUGGCCCAUGGGUAGGCCCUGCAUCCCUGAUCUAGCGCGUGGGGCAGCAGGUGCUGCUG +>U2AF2_K562_rep02_10097 +CAGAUGUAUUUGGGUUGGUCGUCCUCCCAUUGGAACUGAAACUACGGAUCUUCCGACUUCU +>U2AF2_K562_rep02_10099 +UUUUUAAAGUUUCCUAAUGAAAAGUUUGGCCCAUGGGUAGGCCCUGCAUCCCUGAUCUAGC +>U2AF2_K562_rep02_10103 +GUCCAUGUUUGCCACACAGGGUCGGGUGUGCUGACAGCCGGCUGUUAAGCCCUGCCUGCCC +>U2AF2_K562_rep02_10105 +UUUUUAAACAGAUCUCCCACAAACAAAUUUUCGUCGUUUACCUUUUGACCACUGCAGGUAA +>U2AF2_K562_rep02_10107 +GUGUUUAGGAAUGUUCAACGCUCCAAGCCCCAUAGGCUGAUUCAAGAAGAUAAAGUGAGAC +>U2AF2_K562_rep02_10108 
+GUGUUUAGGAAUGUUCAACGCUCCAAGCCCCAUAGGCUGAUUCAAGAAGAUAAAGUGAGAC +>U2AF2_K562_rep02_10110 +CUUCUCCACCUCUUGCCUGGUCCAGCUGGAGCAGAGUGAAGCCAAGUGUGAGGAGGCCUUG +>U2AF2_K562_rep02_10114 +UUUUCCUUUAGGUAGAUGCCCAGACUGCUGGAUUGAAUGCAGAUCUACUUCGAAAAAGUCU +>U2AF2_K562_rep02_10115 +CCACCACUUCUCUCCAUCCUGCAGGCAGCUGCCAGACCCGGCCAUCGAGGACCAGGGUGGG +>U2AF2_K562_rep02_10118 +UUCCUGUUUAACUCGUGCAGGUGCAGUGGUCUGGUGUCUUUCAGUCCGCUGACGUCUUCUG +>U2AF2_K562_rep02_10119 +CUCUAAUUUUUUCCCCAGGCCGUGGAGGAGCUCCUGGAGACCCUGGAUCUGGAAAAGAAGG +>U2AF2_K562_rep02_10120 +CCUGGGGACAGCUGGAGUUCCGGGGUCCCCUGGGCAGCCUUGGGGGCUAAUGACCUGCCCU +>U2AF2_K562_rep02_10121 +UCGUUUUUUUUUGGAGCAGGCAUAUGGGCAACAAAGCUAUGGAACCUAUGGACAGCCCACU +>U2AF2_K562_rep02_10125 +CCUUUGUUGUUCUUUCAGGAGGAGACUCGAAAGAAGCCCAAGAUGUCCAUUGUGGCGUCCG +>U2AF2_K562_rep02_10126 +AUCUUCCUACCCAGAUGCACAAGUCUGGCGUUCUGAGGAAGGCCAUUGAUUACAUCAAAUA +>U2AF2_K562_rep02_10128 +GCGAUUGUUAAAUCUAUUCGUGCCCUGAGAUGUAUGGCUUUAUGCUGAAGAUUGGCUGGAU +>U2AF2_K562_rep02_10129 +CCUUUUUCCCACAGAUCAUCACAGGUGCUAAAGUUUGGCAUUUGGGAACCACAUCCUAAUU +>U2AF2_K562_rep02_10130 +UCUUUCCAGUCUUCCCCUGAAGCAGGUGAAGCAGAAGUUCCAGGCCAUGGACAUCUCCUUG +>U2AF2_K562_rep02_10131 +UAACUGUGCUUCUUCCAGAAGCUGGACGGGAGGUCCCUGAUCAAGCUGAACUUUUCCAAGA +>U2AF2_K562_rep02_10133 +GAAACAUUUCCCCUUGAUCUCCCUAGGGGCAUCUGGUCUCCAAUAAGGCUGCUAUGGAUGA +>U2AF2_K562_rep02_10137 +GCAUUUUGUGACCGACUUAUUCUUAGAUCAUUGGUUUUCCAAAGGCUUUGUGGCCAUGAAG +>U2AF2_K562_rep02_10138 +CCAUCAUUGUGUCCUUUGAUCUUCACACAGCAGGUAUCAUCUGCAUUUUAUGGAUGAGGAA +>U2AF2_K562_rep02_10139 +AUUUUCUCUUUUGAAGAUGCCUUGCCCAGUGGCAUGGAAAGAAGCCCACUUGAUGAUAGGA +>U2AF2_K562_rep02_10142 +UCACAAGGGGCUGGGGUCAGGUUUGGGCUGUUGACGCCUCGGGUCUUCCCUCCAGGUUUGG +>U2AF2_K562_rep02_10143 +GUUUUUAUCUUGCUGUACCUGUAGGGAAUGUUUAAUUCAGCCUUGGAAGUGGCCAAAUUUG +>U2AF2_K562_rep02_10144 +GUUUUUAUCUUGCUGUACCUGUAGGGAAUGUUUAAUUCAGCCUUGGAAGUGGCCAAAUUUG +>U2AF2_K562_rep02_10145 +CUCCACUGCCUUCUCUUCUUCCAGGUGGGCCAUCGUUGGACUAACAGACCAGUGGGUGCAA +>U2AF2_K562_rep02_10152 +UCUCUCCCCCAUAGAGGAGGAGCUCCGGAAGCUGCGAGAAGAAACCAACGCGGAGAUGCUG 
+>U2AF2_K562_rep02_10160 +UCCAGCUGCACUGGGCACAUUCCUCCCCUCACCCUGACUCACAAGGUGUUAGCAAUAAUGG +>U2AF2_K562_rep02_10161 +UCUUUCCUGUUUUUCUUAGGGUCAUAGUGUGCUGAAUUAUAUUGUUAUGAGAUAACACUAG +>U2AF2_K562_rep02_10163 +UGGGCAUUCUCUUUUUGCCACAGGACCCCACCAAUUUGGACAAGUUCAAUGUCUCUAACUU +>U2AF2_K562_rep02_10164 +CCUUGGUAUUUGUUGUAAAUUCUCCUUUCACAGCGAUUGUUAAAUCUAUUCGUGCCCUGAG +>U2AF2_K562_rep02_10165 +UGGAAAUUGCCUUAUUGGAAAAACAUUUCUUACGUGAGUACCAGAAAGCGCUUGGAGGGGA +>U2AF2_K562_rep02_10173 +ACCACAUCAGCAUCGAGGACUCGCGGGUCUACGAGCUGACCAGCAAGGCUGGGCUGUUGUC +>U2AF2_K562_rep02_10174 +UGGCUGUAGAGGGUGGGCAGCUCCUGGUGUGCUCUUAGGCAGGCCAGGUGCAGAAGGUGCC +>U2AF2_K562_rep02_10182 +CAUUCACGGCCUCUACACGGACCCCUGCGGGGUGGUGCUGGACCCAUCGGGGUAUAAAGAC +>U2AF2_K562_rep02_10183 +GCACUUCCCUUGCAGGGCUCCCUGCGGACUGCCGUGGCCGCUGGGAGAGCUUCGUGGAGGA +>U2AF2_K562_rep02_10194 +UCUCAUGAUCUUCUUACAGAUGGAGGGCCGGCGCGACAGCAUGCUAGAGACAGCCAAGCAC +>U2AF2_K562_rep02_10195 +GGUAGAAAAACUACAUAGUGGUGGCUACUGUGCAUCUCUUCCUAACUCCACAUUUGACAAC +>U2AF2_K562_rep02_10196 +GGGCCUGAGGUCGACCAGGAAAGGCCUGUGCCCCCUCCAAGGGCCCCUCUCUUCUACCCAG +>U2AF2_K562_rep02_10197 +AGGGUGACAGCUGUGUUUGCUCCCAUGACAGGAUGAAGGACAUGCGCGUGCAGACUUUCAG +>U2AF2_K562_rep02_10198 +UUCCUUCUUUUUUCCAUUGGUUUAGAUUUUUGUUCUUGGUCUUCAGUUUUAGUAUUAAAAU +>U2AF2_K562_rep02_10208 +CCUUCUUCCCUCCGGCAGAACCAGAGCUGGGGUCUGGGGCGGGCCCUGCCGGCACAGGCAC +>U2AF2_K562_rep02_10209 +CCUGUCUUUUCCCUUUCCCCCGCUGUCACCCCUGUCUCCGUCCAGCCCUUGUCCCUGUGGC +>U2AF2_K562_rep02_10210 +UUUUUAUUUUGUCUCCUCUGUUUUUGUUGCUUAUCUCCUUGUAUUUUUAUUAUUAGUUUUG +>U2AF2_K562_rep02_10211 +UUUGUUUCUCAUUUCCUCCCUUAAUGACUUCUUUUGAGGUAAACACAUACUGUUCUAAUAU +>U2AF2_K562_rep02_10212 +AGCUACACUAAAAAUCAACAAUGAGAUUAGAAGUGUGAAAAGAUUGCAGCUGCUACCAGAA +>U2AF2_K562_rep02_10213 +UCUCUCUUUUCCCUCCUCCCCACCAGAGAGGAGCUGCGGAGUCUAUUCCAGGCCCGGGCCA +>U2AF2_K562_rep02_10214 +UUCCCCCAUUCUUAAUCUUGCAGCUCCUGGAUCUCCCAGGUAUCAUUGAAGGUGCCAAGGA +>U2AF2_K562_rep02_10215 +GGGAGGGAGGCGUCGCGGAGUUUCUCUCGGCCUUUUGUGCCAUCCGCCGAGGCGCCUUGAG +>U2AF2_K562_rep02_10216 
+GGGAGGGAGGCGUCGCGGAGUUUCUCUCGGCCUUUUGUGCCAUCCGCCGAGGCGCCUUGAG +>U2AF2_K562_rep02_10217 +CUUCUUUCCUUCCUUCCUUCCCUGUUUCCUUCCCUCUUUCCUUCCUUCCUCCUGGUCUGUU +>U2AF2_K562_rep02_10218 +CUGAAUACACUCACUUUUAUGGUGGCAAGAAGCCAGGUAAGGCAUGCAGUCUUUCUGUUCC +>U2AF2_K562_rep02_10219 +CUGAAUACACUCACUUUUAUGGUGGCAAGAAGCCAGGUAAGGCAUGCAGUCUUUCUGUUCC +>U2AF2_K562_rep02_11141 +CAGUCUUUUCUCUCUUUCUCCUGCAGGGCUACACCAAGUCCAUUGAUAUUUGGUCUGUAGG +>U2AF2_K562_rep02_11142 +UUUGAUUAUUACUCUCAGACGUGCGUGGCAACAAGUGACUGAGACCUAGAAAUCCAAGCGU +>U2AF2_K562_rep02_11143 +CCAGGCAAGCCGAUUUUUUCAGUUGAUAUUCACCCUGACGGGACCAAGUUCGCAACUGGAG +>U2AF2_K562_rep02_11144 +CCAGGCAAGCCGAUUUUUUCAGUUGAUAUUCACCCUGACGGGACCAAGUUCGCAACUGGAG +>U2AF2_K562_rep02_11145 +UCACCUUCUUUCCUCUUGCUGUCAUCUGCAUUCGUGCUUCCCACCUGUUGUUGGCAUGUCC +>U2AF2_K562_rep02_11147 +GUUUCCCUCUUCCUUCCGUCUUGUUUCCUAACUUCUUACCAAAGUUUAGAGUCUGAGUUUU +>U2AF2_K562_rep02_11148 +CAAACCUAGGAUGAAGCUGGAGGCAGAUUCGUCGCUUUCUCUGGAGAAGGACAGUCAUUGC +>U2AF2_K562_rep02_11150 +CUUUUUUGAGACAGACACUGGGCAGCAUCGUGUUCUUCCAGCGGACGUGUCUAGAACAUCU +>U2AF2_K562_rep02_11151 +CAAGUCCAUUGAUAUUUGGUCUGUAGGCUGCAUUCUGGCAGAAAUGCUUUCUAACAGGCCC +>U2AF2_K562_rep02_11152 +GAUAUCAGCUGCAGAUCACUCAAUACAUGGCCGAGACAAAUCUACAUUGGCCGGAAGCAGC +>U2AF2_K562_rep02_11154 +CGCUGUCUCUGCUCCCUCUAGGAAAGGCCACCUGCCUGAGCUUUGAAAUGGCCCACACCGU +>U2AF2_K562_rep02_11156 +UAAUAGCAUUGCUGAUGACAUUUUCCCUGUUAUCAGUUACUUAUGGGGCCAUUCGCUGCAA +>U2AF2_K562_rep02_11158 +UUUAUGUUUCCUAGGGAAGUGCCCGACAGGGUGGCACCACUACGAAGGCACGGCCAGCUGC +>U2AF2_K562_rep02_11159 +UUCCCCACCCCCUGUCUUACAUCCACCCUGGCCCUGUAAAUUCUUUUUUCCUUUGUUGCGU +>U2AF2_K562_rep02_11160 +CUCCUUUUUUUUUCUCCUGAGACAGGGUCUUGCCCUGUUGCCUAAGCAGGCAUGGAGUGGC +>U2AF2_K562_rep02_11164 +CUUUUUUCUCUAAUUGGACUGCAGCGUCAACUAUUCUGCCUCGCUAGAAAGUUCUUGGUAU +>U2AF2_K562_rep02_11165 +UGGAGCCUGGUGGGGAGCUGCUGGAGGGCUUGGGGCCAGGGAGGGAUGUGGCCUGACUUGG +>U2AF2_K562_rep02_11167 +CACCUUCUUAUCUGUGGUGAGGGCCACCCGCUGCCCCUCCCUCCUUCCUAUCCCUGUAUCU +>U2AF2_K562_rep02_11169 +UUCACUUUUAGCUUGUUCCAGCUGCCAGGCUGAGGGGACACCUUACGUCCCUCCCUCCUGA 
+>U2AF2_K562_rep02_11172 +GACCACUGCCUCUCUCCCCACAGGGACCACUGAAGAAAGACCGAAUUGCAAAGGAAGAAGG +>U2AF2_K562_rep02_11176 +CCACUUGUGUCCACACAGGCCCUGGGAGGAGCGGGGACACUGAGGACCUCUCUCCAAAUUG +>U2AF2_K562_rep02_11177 +UGUAUUUCUGAAUUGUAGAGUCAAAGGAGAAGUUCAGAGUCCCAUCAGCAAUGCACCUGUC +>U2AF2_K562_rep02_11183 +CUCCCGCUGCAUGCAGGGAUUCGGGUUCGUAACUUUCGAGAAUAGUGCUGAUGCAGACAGG +>U2AF2_K562_rep02_11184 +GCUCCCUGGUCUUGAGCAUCUGGGGCCCGAGCUGCCUGGGCAUUGGUUGGAAGUAGCCCUG +>U2AF2_K562_rep02_11187 +UGUUUUCAGAGACUCCCUACGGGAGAGGAUGCCCCGCAGGAACAUGGUAAGUAGUGAGGCG +>U2AF2_K562_rep02_11192 +UAACGAUGUGCAUGUUUUCCCCCCUUCUCCCGCUGCAUGCAGGGAUUCGGGUUCGUAACUU +>U2AF2_K562_rep02_11195 +CUUUGGUUUUUCAGGGCAGCCGAUGAAGUGCAACCUUCACAUGAAUGGGAAUGUUAUCACC +>U2AF2_K562_rep02_11196 +UUCUUCUCAUACCCCUACAGGACAAGAGGACCCUGCCUUGGUGUGAGAGUGAGGGAAGAGG +>U2AF2_K562_rep02_11199 +UCCAAAGCUGGGAGUCAUGUUGCCUGCAGGGACUCUUUCCUUACUGGGCCCAGGAGUUCGA +>U2AF2_K562_rep02_11201 +UUUGCUAUUUUCCCUCACCUCCCAGGGUAAGAUAAUCAGGAGCAGAAUGUGAAGAACUUUC +>U2AF2_K562_rep02_11205 +ACUCUAGCUAGAAGACAGAAGGCCAGCUCCCAAGCAGAUCAGAGGGUGGAAUUUUCAUUCU +>U2AF2_K562_rep02_11206 +UGAUGUGUCUUUUGCAGGUGAAGGUGGGAGACAAGGUCUCUGCUGACGAUGAGGCAGAGCC +>U2AF2_K562_rep02_11207 +AUCAUUUAUUGGAUUUCAGUUCAACAGACACUCCUAUGAGAAGCCCUUUGAGAUACGCCAG +>U2AF2_K562_rep02_11208 +ACGUGGUUUUUGGAUCCGUAGCACCCCGAGCAGAAGGCAGACCGGUAUUUUGUGUUAUACA +>U2AF2_K562_rep02_11211 +UCUCCACAUCUCCCCACAGCGCUGCGCACAUUGUCAGUGACUCUUUGUUGCAUGGUGAGUG +>U2AF2_K562_rep02_11215 +UGGCCCCUUUGCUGUCCAUCCUUUUUCAGGGCGUGGACUCCCUGGUGCUAGAAAGCGUGAU +>U2AF2_K562_rep02_11216 +UGGCCCCUUUGCUGUCCAUCCUUUUUCAGGGCGUGGACUCCCUGGUGCUAGAAAGCGUGAU +>U2AF2_K562_rep02_11226 +GCUUUUUACUUUCUCACGCAGGUCUGGCCUAAGAAGGAAAUGGAAAAUGAAAAGGCUUGAA +>U2AF2_K562_rep02_11227 +UGGUUUCUCUCCCUCGGCACCUGUUGCCUAGGAGUGGUCCGCAGACCUGAAUCGAACCCUC +>U2AF2_K562_rep02_11228 +ACUAAAUGUUAUUUCCUGAGUCACUUUUUUAAAGAGCUGCAUAAGCAACAAAGCUGCAUCA +>U2AF2_K562_rep02_11229 +CGUCUGCUCCUACUCCACAGCCGCGUCGUGUGACUCCUUCAAGAACCAGCUGGUCACCCGG +>U2AF2_K562_rep02_11234 
+UUCUCUCUUUACAGGUGCUGGGCUGUGCUGUGGAGCUCCCUGAUGUCAGCUGCAAGCGGUU +>U2AF2_K562_rep02_11240 +UUUUCUCCUUUCAUUACCUACCUCUCCAUUAUGCCUCAGUUGUAACGGUGAGUAAAACUAU +>U2AF2_K562_rep02_11241 +CACUUCCUGUCACCUCCCAGGGCUCCCCCAUCCUGCUGGCUGCCAGGCGGGUUGGCCGCUC +>U2AF2_K562_rep02_11253 +CUUCCUUAGUUUUUGUCUUUUUUGAUCUGACUGUAGAUGAUCAGUCAGUUUAUCCUAAGGC +>U2AF2_K562_rep02_11254 +UUUAUUUCCUUCGGGACCUGGGGACAGGGUUUGGUCAGCACCUGCAAGGUCUGUAGUUGCC +>U2AF2_K562_rep02_11255 +AUUGCUUUGCAAUUCCAGGAGCGGCAUUGCCCCCGAAUGUCCAGAUUAUCCCUGUUUUUGU +>U2AF2_K562_rep02_12216 +UUCCCUUUUGUUCCCAGUGCCCCUCGCUGCCUUGUGUUCUUUGACAUUGGAAAGAAGGUCU +>U2AF2_K562_rep02_12217 +CUCCUUUCUUCCUUCCCUUCCCUUCCCCUCCCCUCCCCCAGGCUGGAGUGCAGAGGCACGA +>U2AF2_K562_rep02_12218 +CUCCUUUCUUCCUUCCCUUCCCUUCCCCUCCCCUCCCCCAGGCUGGAGUGCAGAGGCACGA +>U2AF2_K562_rep02_12219 +AGAUUUUCCACAGGUGUGGGCCCCAUUAGCUCUGGCCACCUGAGAAAGCCCUCAGGCAAAG +>U2AF2_K562_rep02_12220 +GGAUGUUAAUUCUUCUCUAUUUUAGAUUUUCCACAGGUGUGGGCCCCAUUAGCUCUGGCCA +>U2AF2_K562_rep02_12221 +UUACAGGUAUCACGCUCAUUGCUGUGGAUGAGGCUCACUGUAUUUCUGAGUGGGGGCAUGA +>U2AF2_K562_rep02_12222 +CUUUUCACAGUCCUCUUACUCCCAGUUACUGGCAGCUACAUGCCUUACCAAGCUUGUAUCA +>U2AF2_K562_rep02_12223 +CCUGUUUUUUUUUCCCCCUGGCAGAGUUAGCCACUUCUUCCUAUGUGUAAGCAUAUCAUCA +>U2AF2_K562_rep02_12224 +UUUAUGUUUUUUUUUCAGGGGAGCGGAAUAUUGGUUUCUUUUACUUGUUGUUUUCAGUUUU +>U2AF2_K562_rep02_12225 +CCCUCUUUCUCUCUCAGCUCCCACAGGCCCAUUCUGGUGACUCAUGACUUGUAUACACAGA +>U2AF2_K562_rep02_12226 +UUUUUUUUUUUUUUUUUAAUAGGGUCUCACUCUGUUGCUCGUGCUGGAGUGACAGUGGUGU +>U2AF2_K562_rep02_12227 +CCUUCCUUUCUUUUUCCCGCUUCCUUAAUGUAAUUUAAACCCUGGCAAACAUUCUUUAGAA +>U2AF2_K562_rep02_12228 +UUUUUCCAGGAGCUGGAGGAGGGAAUGAUAUUCAGUGGUGUUUUUCUCAGGUGAAAGGAGC +>U2AF2_K562_rep02_12229 +AUCCUUUCCUCCGUUUAGGAGCUGCAGUGAACACUUUUCAUUGAACAUGUAGCAUGAAGAG +>U2AF2_K562_rep02_12230 +CAUUAUUUGUUUACUCAUUUGGAGUGUUCCUUGACUUUUAUCCCCUCUUACCUAGUGACAU +>U2AF2_K562_rep02_12231 +AGAUAGAUCCAUUUAUCCUGCCUCCUAGGGAGAAGUUUCUGCCUGGAUUGAAACAAAAAAA +>U2AF2_K562_rep02_12232 +AACAGUGUAAAUUUGAUGGCCAGGAGACAAAAGGAUCCAAGUUCAUUACCUCCAGUGCGAG 
+>U2AF2_K562_rep02_12233 +CCUUUUUCUCCUCUUUACCGCAUCUUUCGUCUUGCAACACAGAGACCUAAAGGGCAAGGAA +>U2AF2_K562_rep02_12234 +UAUUUUCCAGGCCAGAGAUCCUCAGCAGGAGCCUAUGGAAGAGAUAGAAAAUUUGAAGAAA +>U2AF2_K562_rep02_12235 +CUGUUGCUCGUGCUGGAGUGACAGUGGUGUGAUCUUGGUUCGCUGCAACCUCCGCCUCUUG +>U2AF2_K562_rep02_12236 +UCAGAUACAAGUAUUGUUGGUCUUAUUUUCCAGGCCAGAGAUCCUCAGCAGGAGCCUAUGG +>U2AF2_K562_rep02_12237 +UUGUUCCCCUUUCCCAUUCCAGGGAGCUCUGGGCUCUGUUCUACUUAUUCGUAUUGGCAGG +>U2AF2_K562_rep02_12238 +CCUUCCUUUCUUUUUUUUAGAAGGCAUCUCACACUGUCACCCAGGCUGGAGUGCUGGAGUG +>U2AF2_K562_rep02_12239 +CCUUCCUUCCUUCCUUUUCUUCCUUUCUUUUCCUACCUUCCUUUUCCUUCCUUCCUUUCUU +>U2AF2_K562_rep02_12243 +UGUUCUCUUCUUGUUUCUUCUUCCCCACCAGCCAAAAAUCUAUGAUGUUAUAGCAAGGAUC +>U2AF2_K562_rep02_12244 +CUUCUUUUUCUGCACAGGCAGACACCACCCAUCCUUUAACCAAGCACAGAAAAAUAGCCUC +>U2AF2_K562_rep02_12245 +UCAGAGAUCUGCAGCGAAUAACCCUGCCCAGCAUUAACCGCCUCAGGCACUUCACCAAUGA +>U2AF2_K562_rep02_12249 +UUUUAGGCGUAAUUUUCAUUUUUUCAGAUGUUUUUCUACUUAAAUAGCACAUAUGCAGAAG +>U2AF2_K562_rep02_12250 +UUGAUUUUUUUUCCCCCUAGAGGAAGAAAUCCUACUUAGCGACAUGAACAAACAGUUGACU +>U2AF2_K562_rep02_12251 +CAGUGGUGCGAGGCAUAAUUUCUUCCUUAGGUUCCAGCAGAAAUGGAAGGGUUAGGACGAU +>U2AF2_K562_rep02_12252 +UUUUCCAGUAUGACAUGAUGGGAAGAAAUCAGACUGCUGUGAGAGAAGAGAUGAUUCUCCU +>U2AF2_K562_rep02_12253 +AUUCUUCAGUUAGCUUCAUCUUCAGAGCAAGCUGAUGAUGGCUUGUGUGUGCUAGCAGGAU +>U2AF2_K562_rep02_12254 +CCUUUCUUCCUUCCUUUCCUCCUUCCUCUUCUCCUCCUCCCCUUCCUUCCUUCCUUCCUUC +>U2AF2_K562_rep02_12255 +AUUCUUUCUCUUUUAGGUCCAGGUCCUAACAUUUGAUAGUCAUUUAAAGGCAUGAAGAUUC +>U2AF2_K562_rep02_12256 +UUUUUUUUUUCCACCUACAGCAGCUGUUUUUACCCUGUGGUCAGUCAGGUACUAUAUUUAG +>U2AF2_K562_rep02_12257 +CAGCUGUCUCCUUCUCUUACAGGGUGGGGAGAAACAGCGGGUCUUCACUGGUAUUGUUACC +>U2AF2_K562_rep02_12258 +AGGACAGGACCUUGCUGGGAACCUUCAGUAAGUUGUCCUUUUCUUUCUCAAACUUCCCAUG +>U2AF2_K562_rep02_12259 +UUCUUCUUCAUCUAGGGGCUCUUGGCCAGCUGGGAGUGGGGCUUGCUAAUCUUUUGAGGUA +>U2AF2_K562_rep02_12260 +ACCAACUAGGAUUUUUCUCAGGAGCACAUGGAUGAAGUAUGCUCCUCGCAGCUUCUAACUU +>U2AF2_K562_rep02_12261 
+UUUUUUAAGGGACAGGGUCUUGAUCUGUCACCCAAGCUGGAGUGCUGAGGUGUGAUUGUAA +>U2AF2_K562_rep02_12262 +GUCUUCUGUUUUCCCCAGGCAGGGUGCCUGAGCUGUAUUCCCCAGCACACCCACUCCCGCA +>U2AF2_K562_rep02_12263 +AUUUCUGCACAUCUAGGAUGACAGUACGAGCCAUAGUGACCACCAAGACCCCAUCUCAUUA +>U2AF2_K562_rep02_12265 +UGGAUUUGUACAUUAUAGGUUCAUUGCCCUCAAGUGGCAGAAGGAAAAGCACAUGGAAUAU +>U2AF2_K562_rep02_12266 +UUUACUUUUUUUCUUUAAGGAUGGAUGUUGUGUUCUCUUUAUUUUUUUCCUACUACUUUAA +>U2AF2_K562_rep02_12267 +CCUUCCUUCCUCCCUUCCUUCCUUUCUGUUAUUCAGCCAGAAGUAUCAGCAUCACUGUUCU +>U2AF2_K562_rep02_12268 +UUUUGUUGGUUCUUUGAGCCUCUCACAGGUUGCAUCAUAGUCUAUGUGGAUAGAUGAAGAA +>U2AF2_K562_rep02_12269 +UUUUUUUUUUUUUUUUUUUUUUUUUUUGGUAGGAAACUCAACAGUGUAAAUUUGAUGGCCA +>U2AF2_K562_rep02_12274 +UGAUUUUGUCCCCUAGAGCAAGGUCCGUGGUCCUGUCAGUGGAAGCCCGGAUAGCAUGAAU +>U2AF2_K562_rep02_12275 +GGUGGGGUGGGGGCGGGGAGGGCUCCCGGGAGGCAAGUGGUCACGGUGAGAGUCACUGGGC +>U2AF2_K562_rep02_12276 +UACCCAUUGCUUUUACUGAUUAGGUAUGAAUUUCAGCCCUUUAUUUCCUUCUAAUUUUGGA +>U2AF2_K562_rep02_12279 +CCUCAUUUCACCCAGGAGGAAGGUGCAGCUCAGAGCUGUUACGACUAGUCAGAGAGAGCGA +>U2AF2_K562_rep02_12281 +AUAAUUCUUACCUGCCUCCUUUCUCUUCCCGGACCUUCCUAAUUUGAAGAGGUGAUUUGGA +>U2AF2_K562_rep02_12286 +UUUCUCUCCCUAAUCUUUUCUCCAAUCAGGCUUCAAUGUUAGCUGCAGAAAAUGACCCUUA +>U2AF2_K562_rep02_12287 +UUUUUGUUUUUCAGCCCUGGUACCUGACAGUGUAAAGAAGGAGCUCCUACAAAGAAUAAGA +>U2AF2_K562_rep02_12292 +UUUACCUGGGUAACAAUUUUACUUUUUACCACAGUCACCAAGGAGCUAGUUAGCUGGAUGA +>U2AF2_K562_rep02_12293 +UAGUUUGCAGGUCGAAGUAAGAAGGAAACCAAAUAUUCUCUUAAGGCUGUCGAAGACAUGU +>U2AF2_K562_rep02_12299 +UUUGUUUUUCUUUUCAGGUAUGGAACCCUUCAGAUCAAAGCUUACCAAUAAAUUCAGUAUG +>U2AF2_K562_rep02_12300 +UUUGUUUUUCUUUUCAGGUAUGGAACCCUUCAGAUCAAAGCUUACCAAUAAAUUCAGUAUG +>U2AF2_K562_rep02_12302 +CUCAUUUUUCUCUUGCCGCCGCCAUGUAAGAGGUAACUUUCACCUCCCGUCAUGAUUCUGA +>U2AF2_K562_rep02_12303 +UUAUUUUUCUUAUUUAGGGAAGGUUACCGCCACCUCUCUGUAGGAAAUCAAGUGUACAUGA +>U2AF2_K562_rep02_12305 +ACUUGCUAUCCUUCCCUUGCAGGAAGACACGUUUCAGCAGUAUGUAAGACCAGAGAUUAAC +>U2AF2_K562_rep02_12306 +CUUGUGCAAUUUCCAGGUGAUGAACAGCCUCCUUCUAAAUCAUUGACCACAUUUCUUAUUC 
+>U2AF2_K562_rep02_12307 +UUCUCUUUUUGUGCCAGGUCAUACUUUAAGGAGCCCAAGAGCUUUAUAACAUAACAAAAGA +>U2AF2_K562_rep02_12308 +UUCUCUUUUUGUGCCAGGUCAUACUUUAAGGAGCCCAAGAGCUUUAUAACAUAACAAAAGA +>U2AF2_K562_rep02_12311 +UCCCUUAAACUUUAUACCACCAGAAUACCAACAGAAGCUAAAUGUAGCAAAUGUGACUGCC +>U2AF2_K562_rep02_12312 +AAAAUUAAGUUCUUUUAUUAGCUGGCCGUUCUCUCAUUAUCUCAAAUUUAUUUAAGUAUUU +>U2AF2_K562_rep02_12316 +UUUUCUUCUUUGUAGCAUGGAGCAGAUCCAACUAAAAAGAACAGAGAUGGAAAUACACCUU +>U2AF2_K562_rep02_12317 +CUUUUCUCUAGGUUAGUAACACUGAAGAAAUCACUUUUGAAGCAUUGAAGAAAGCAAUUGG +>U2AF2_K562_rep02_12318 +UCAUAGCUCCUUCUCCCCCUGCUUCUUUCCCAAAUGAAUGAGUAUUUCUUUUAGAUAAAUU +>U2AF2_K562_rep02_12321 +AUUAUUUUUUUGUGUUGGCCAGGAAGUGAACCCAGGUCAACUGCUUGGAAGGUGGCUAUGC +>U2AF2_K562_rep02_12322 +ACAGGCCCAGACCUUCUCUUUCCCUUUCCAGCAGCCGGAGAAGUGCGACAACAACCAGUAC +>U2AF2_K562_rep02_12323 +CCCACCGCCUUGACACCCCCACCCCCGCAGGGAAGCAGCUGGUGCACUACACAGCGCAGCC +>U2AF2_K562_rep02_12324 +UUUUUUCAUUACAUUACAGGAAGCAGAAUCUGGUAAUAUAAGUCAAAAGUCUGAUGAAGAA +>U2AF2_K562_rep02_12325 +GUUUUCUUUUUUCCCUUUCCCAGUUUGACUUUUGCCAUCUAGAGUUUGUAAAUUAAGUGGU +>U2AF2_K562_rep02_12326 +CUUUCCCUUCCACAGCCCAGGGUCCGUCUGCAUUUUGUGGAGCUGGGCUCCGGCCCUGCUG +>U2AF2_K562_rep02_12334 +UUUGACUUUGCUUUGCUUUUCCCCUUUUGUGUUUGCAGUUGAAUGGAGAGGUUUUCAUAUU +>U2AF2_K562_rep02_12335 +AUAUUAAACUCUUCAGAAGGAAGUCACUGUGCAUAGCCAUCCCCUAAGAAGAGGGCAUUCC +>U2AF2_K562_rep02_12336 +ACACUUCUGUUCCUUUGUCUGCAGGAGAGCUGGAGGUGUUUCAGAAAGAUGGGGAACGAAA +>U2AF2_K562_rep02_12337 +UAAAACUGUGGUUUGCAAGCAGAAGGCGCUGGAACUGUUGCCCAAGGUGGAAGAGGUGGUG +>U2AF2_K562_rep02_12338 +CUAUCCUUCUACCUCCACGCACGUUUUUUAAGGCAGCGGCAAAAGUAGUAGAAAGCAAAAG +>U2AF2_K562_rep02_12339 +UCAGCUUUUUAAUUAAAUGAAGCCAAGUGGGAUUUGCAUAAAGUGAAUGUUUACCAUGAAG +>U2AF2_K562_rep02_12340 +UUUUCCUCCUCAAUCUUCCUUUGCCCUACCUAUGUGUUACUAGAGAACAUUUCUACAAAUU +>U2AF2_K562_rep02_12341 +UCUUUUUCCUUCCUCCCUCCCUGUCUCCCUCCCUCUCUGCCUCCCUCCCUCCCUCCCUCUU +>U2AF2_K562_rep02_12342 +UGUCUUUUUUUCUUUAGUGCUCCAGACAAUGAAACAUCCAAAUCUGCUAAUCAAGAUACCU +>U2AF2_K562_rep02_12343 
+CUUUGUACCAAUAGGUAAUUUGUCGUCCAGAUGCUCUGCUAUAUGUGAAGUAUCAUUUUUC +>U2AF2_K562_rep02_12344 +CUUUGUACCAAUAGGUAAUUUGUCGUCCAGAUGCUCUGCUAUAUGUGAAGUAUCAUUUUUC +>U2AF2_K562_rep02_12352 +UUUUUCCUCUGAAUUUACAUGGAAGGAGCGGUAGAUGAUGAGACAUAUAAGAUCCUCACAU +>U2AF2_K562_rep02_12353 +AGAUGCCACUGCCUCCUUUCCAUUGUCAGCUGGCGGGUGACGCGACUGUUGUUGCACUGGG +>U2AF2_K562_rep02_12354 +AGAUGCCACUGCCUCCUUUCCAUUGUCAGCUGGCGGGUGACGCGACUGUUGUUGCACUGGG +>U2AF2_K562_rep02_12355 +CUAACUUCUCUAGCCAAAUACAGAUAGUCUUUCCCACUGAGUGUCUGUCAACAACUAGAUU +>U2AF2_K562_rep02_12356 +UCCCUGAUUCUUUUUCAAGGGCCGCUUGAAGAUGCCAUUGAAGAUGAGGAAGAAGAAUGUC +>U2AF2_K562_rep02_12357 +AUUUUAAUUCUAGUCUAGGUGAUGGCUGCUCCUUUCCAACUUGCCUUGUUAACCAGGAUCC diff -r 000000000000 -r 7653ebd919bb test-data/fimo_background_probs_hsa_chrM.txt --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/fimo_background_probs_hsa_chrM.txt Mon Jul 14 21:33:08 2025 +0000 @@ -0,0 +1,7 @@ +# 0-order Markov frequencies from file hsa_chrM.fa +# seqs: 1 min: 16569 max: 16569 avg: 16569.0 sum: 16569 alph: DNA +# order 0 +A 3.093e-01 +C 3.127e-01 +G 1.309e-01 +T 2.471e-01 diff -r 000000000000 -r 7653ebd919bb test-data/hsa_chrM.fa --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/hsa_chrM.fa Mon Jul 14 21:33:08 2025 +0000 @@ -0,0 +1,238 @@ +>chrM +GATCACAGGTCTATCACCCTATTAACCACTCACGGGAGCTCTCCATGCATTTGGTATTTTCGTCTGGGGG +GTATGCACGCGATAGCATTGCGAGACGCTGGAGCCGGAGCACCCTATGTCGCAGTATCTGTCTTTGATTC +CTGCCTCATCCTATTATTTATCGCACCTACGTTCAATATTACAGGCGAACATACTTACTAAAGTGTGTTA +ATTAATTAATGCTTGTAGGACATAATAATAACAATTGAATGTCTGCACAGCCACTTTCCACACAGACATC +ATAACAAAAAATTTCCACCAAACCCCCCCTCCCCCGCTTCTGGCCACAGCACTTAAACACATCTCTGCCA +AACCCCAAAAACAAAGAACCCTAACACCAGCCTAACCAGATTTCAAATTTTATCTTTTGGCGGTATGCAC +TTTTAACAGTCACCCCCCAACTAACACATTATTTTCCCCTCCCACTCCCATACTACTAATCTCATCAATA +CAACCCCCGCCCATCCTACCCAGCACACACACACCGCTGCTAACCCCATACCCCGAACCAACCAAACCCC +AAAGACACCCCCCACAGTTTATGTAGCTTACCTCCTCAAAGCAATACACTGAAAATGTTTAGACGGGCTC +ACATCACCCCATAAACAAATAGGTTTGGTCCTAGCCTTTCTATTAGCTCTTAGTAAGATTACACATGCAA 
+GCATCCCCGTTCCAGTGAGTTCACCCTCTAAATCACCACGATCAAAAGGAACAAGCATCAAGCACGCAGC +AATGCAGCTCAAAACGCTTAGCCTAGCCACACCCCCACGGGAAACAGCAGTGATTAACCTTTAGCAATAA +ACGAAAGTTTAACTAAGCTATACTAACCCCAGGGTTGGTCAATTTCGTGCCAGCCACCGCGGTCACACGA +TTAACCCAAGTCAATAGAAGCCGGCGTAAAGAGTGTTTTAGATCACCCCCTCCCCAATAAAGCTAAAACT +CACCTGAGTTGTAAAAAACTCCAGTTGACACAAAATAGACTACGAAAGTGGCTTTAACATATCTGAACAC +ACAATAGCTAAGACCCAAACTGGGATTAGATACCCCACTATGCTTAGCCCTAAACCTCAACAGTTAAATC +AACAAAACTGCTCGCCAGAACACTACGAGCCACAGCTTAAAACTCAAAGGACCTGGCGGTGCTTCATATC +CCTCTAGAGGAGCCTGTTCTGTAATCGATAAACCCCGATCAACCTCACCACCTCTTGCTCAGCCTATATA +CCGCCATCTTCAGCAAACCCTGATGAAGGCTACAAAGTAAGCGCAAGTACCCACGTAAAGACGTTAGGTC +AAGGTGTAGCCCATGAGGTGGCAAGAAATGGGCTACATTTTCTACCCCAGAAAACTACGATAGCCCTTAT +GAAACTTAAGGGTCGAAGGTGGATTTAGCAGTAAACTAAGAGTAGAGTGCTTAGTTGAACAGGGCCCTGA +AGCGCGTACACACCGCCCGTCACCCTCCTCAAGTATACTTCAAAGGACATTTAACTAAAACCCCTACGCA +TTTATATAGAGGAGACAAGTCGTAACATGGTAAGTGTACTGGAAAGTGCACTTGGACGAACCAGAGTGTA +GCTTAACACAAAGCACCCAACTTACACTTAGGAGATTTCAACTTAACTTGACCGCTCTGAGCTAAACCTA +GCCCCAAACCCACTCCACCTTACTACCAGACAACCTTAGCCAAACCATTTACCCAAATAAAGTATAGGCG +ATAGAAATTGAAACCTGGCGCAATAGATATAGTACCGCAAGGGAAAGATGAAAAATTATAACCAAGCATA +ATATAGCAAGGACTAACCCCTATACCTTCTGCATAATGAATTAACTAGAAATAACTTTGCAAGGAGAGCC +AAAGCTAAGACCCCCGAAACCAGACGAGCTACCTAAGAACAGCTAAAAGAGCACACCCGTCTATGTAGCA +AAATAGTGGGAAGATTTATAGGTAGAGGCGACAAACCTACCGAGCCTGGTGATAGCTGGTTGTCCAAGAT +AGAATCTTAGTTCAACTTTAAATTTGCCCACAGAACCCTCTAAATCCCCTTGTAAATTTAACTGTTAGTC +CAAAGAGGAACAGCTCTTTGGACACTAGGAAAAAACCTTGTAGAGAGAGTAAAAAATTTAACACCCATAG +TAGGCCTAAAAGCAGCCACCAATTAAGAAAGCGTTCAAGCTCAACACCCACTACCTAAAAAATCCCAAAC +ATATAACTGAACTCCTCACACCCAATTGGACCAATCTATCACCCTATAGAAGAACTAATGTTAGTATAAG +TAACATGAAAACATTCTCCTCCGCATAAGCCTGCGTCAGATTAAAACACTGAACTGACAATTAACAGCCC +AATATCTACAATCAACCAACAAGTCATTATTACCCTCACTGTCAACCCAACACAGGCATGCTCATAAGGA +AAGGTTAAAAAAAGTAAAAGGAACTCGGCAAATCTTACCCCGCCTGTTTACCAAAAACATCACCTCTAGC +ATCACCAGTATTAGAGGCACCGCCTGCCCAGTGACACATGTTTAACGGCCGCGGTACCCTAACCGTGCAA 
+AGGTAGCATAATCACTTGTTCCTTAAATAGGGACCTGTATGAATGGCTCCACGAGGGTTCAGCTGTCTCT +TACTTTTAACCAGTGAAATTGACCTGCCCGTGAAGAGGCGGGCATAACACAGCAAGACGAGAAGACCCTA +TGGAGCTTTAATTTATTAATGCAAACAGTACCTAACAAACCCACAGGTCCTAAACTACCAAACCTGCATT +AAAAATTTCGGTTGGGGCGACCTCGGAGCAGAACCCAACCTCCGAGCAGTACATGCTAAGACTTCACCAG +TCAAAGCGAACTACTATACTCAATTGATCCAATAACTTGACCAACGGAACAAGTTACCCTAGGGATAACA +GCGCAATCCTATTCTAGAGTCCATATCAACAATAGGGTTTACGACCTCGATGTTGGATCAGGACATCCCG +ATGGTGCAGCCGCTATTAAAGGTTCGTTTGTTCAACGATTAAAGTCCTACGTGATCTGAGTTCAGACCGG +AGTAATCCAGGTCGGTTTCTATCTACNTTCAAATTCCTCCCTGTACGAAAGGACAAGAGAAATAAGGCCT +ACTTCACAAAGCGCCTTCCCCCGTAAATGATATCATCTCAACTTAGTATTATACCCACACCCACCCAAGA +ACAGGGTTTGTTAAGATGGCAGAGCCCGGTAATCGCATAAAACTTAAAACTTTACAGTCAGAGGTTCAAT +TCCTCTTCTTAACAACATACCCATGGCCAACCTCCTACTCCTCATTGTACCCATTCTAATCGCAATGGCA +TTCCTAATGCTTACCGAACGAAAAATTCTAGGCTATATACAACTACGCAAAGGCCCCAACGTTGTAGGCC +CCTACGGGCTACTACAACCCTTCGCTGACGCCATAAAACTCTTCACCAAAGAGCCCCTAAAACCCGCCAC +ATCTACCATCACCCTCTACATCACCGCCCCGACCTTAGCTCTCACCATCGCTCTTCTACTATGAACCCCC +CTCCCCATACCCAACCCCCTGGTCAACCTCAACCTAGGCCTCCTATTTATTCTAGCCACCTCTAGCCTAG +CCGTTTACTCAATCCTCTGATCAGGGTGAGCATCAAACTCAAACTACGCCCTGATCGGCGCACTGCGAGC +AGTAGCCCAAACAATCTCATATGAAGTCACCCTAGCCATCATTCTACTATCAACATTACTAATAAGTGGC +TCCTTTAACCTCTCCACCCTTATCACAACACAAGAACACCTCTGATTACTCCTGCCATCATGACCCTTGG +CCATAATATGATTTATCTCCACACTAGCAGAGACCAACCGAACCCCCTTCGACCTTGCCGAAGGGGAGTC +CGAACTAGTCTCAGGCTTCAACATCGAATACGCCGCAGGCCCCTTCGCCCTATTCTTCATAGCCGAATAC +ACAAACATTATTATAATAAACACCCTCACCACTACAATCTTCCTAGGAACAACATATGACGCACTCTCCC +CTGAACTCTACACAACATATTTTGTCACCAAGACCCTACTTCTAACCTCCCTGTTCTTATGAATTCGAAC +AGCATACCCCCGATTCCGCTACGACCAACTCATACACCTCCTATGAAAAAACTTCCTACCACTCACCCTA +GCATTACTTATATGATATGTCTCCATACCCATTACAATCTCCAGCATTCCCCCTCAAACCTAAGAAATAT +GTCTGATAAAAGAGTTACTTTGATAGAGTAAATAATAGGAGCTTAAACCCCCTTATTTCTAGGACTATGA +GAATCGAACCCATCCCTGAGAATCCAAAATTCTCCGTGCCACCTATCACACCCCATCCTAAAGTAAGGTC +AGCTAAATAAGCTATCGGGCCCATACCCCGAAAATGTTGGTTATACCCTTCCCGTACTAATTAATCCCCT 
+GGCCCAACCCGTCATCTACTCTACCATCTTTGCAGGCACACTCATCACAGCGCTAAGCTCGCACTGATTT +TTTACCTGAGTAGGCCTAGAAATAAACATGCTAGCTTTTATTCCAGTTCTAACCAAAAAAATAAACCCTC +GTTCCACAGAAGCTGCCATCAAGTATTTCCTCACGCAAGCAACCGCATCCATAATCCTTCTAATAGCTAT +CCTCTTCAACAATATACTCTCCGGACAATGAACCATAACCAATACTACCAATCAATACTCATCATTAATA +ATCATAATAGCTATAGCAATAAAACTAGGAATAGCCCCCTTTCACTTCTGAGTCCCAGAGGTTACCCAAG +GCACCCCTCTGACATCCGGCCTGCTTCTTCTCACATGACAAAAACTAGCCCCCATCTCAATCATATACCA +AATCTCTCCCTCACTAAACGTAAGCCTTCTCCTCACTCTCTCAATCTTATCCATCATAGCAGGCAGTTGA +GGTGGATTAAACCAAACCCAGCTACGCAAAATCTTAGCATACTCCTCAATTACCCACATAGGATGAATAA +TAGCAGTTCTACCGTACAACCCTAACATAACCATTCTTAATTTAACTATTTATATTATCCTAACTACTAC +CGCATTCCTACTACTCAACTTAAACTCCAGCACCACGACCCTACTACTATCTCGCACCTGAAACAAGCTA +ACATGACTAACACCCTTAATTCCATCCACCCTCCTCTCCCTAGGAGGCCTGCCCCCGCTAACCGGCTTTT +TGCCCAAATGGGCCATTATCGAAGAATTCACAAAAAACAATAGCCTCATCATCCCCACCATCATAGCCAC +CATCACCCTCCTTAACCTCTACTTCTACCTACGCCTAATCTACTCCACCTCAATCACACTACTCCCCATA +TCTAACAACGTAAAAATAAAATGACAGTTTGAACATACAAAACCCACCCCATTCCTCCCCACACTCATCG +CCCTTACCACGCTACTCCTACCTATCTCCCCTTTTATACTAATAATCTTATAGAAATTTAGGTTAAATAC +AGACCAAGAGCCTTCAAAGCCCTCAGTAAGTTGCAATACTTAATTTCTGTAACAGCTAAGGACTGCAAAA +CCCCACTCTGCATCAACTGAACGCAAATCAGCCACTTTAATTAAGCTAAGCCCTTACTAGACCAATGGGA +CTTAAACCCACAAACACTTAGTTAACAGCTAAGCACCCTAATCAACTGGCTTCAATCTACTTCTCCCGCC +GCCGGGAAAAAAGGCGGGAGAAGCCCCGGCAGGTTTGAAGCTGCTTCTTCGAATTTGCAATTCAATATGA +AAATCACCTCGGAGCTGGTAAAAAGAGGCCTAACCCCTGTCTTTAGATTTACAGTCCAATGCTTCACTCA +GCCATTTTACCTCACCCCCACTGATGTTCGCCGACCGTTGACTATTCTCTACAAACCACAAAGACATTGG +AACACTATACCTATTATTCGGCGCATGAGCTGGAGTCCTAGGCACAGCTCTAAGCCTCCTTATTCGAGCC +GAGCTGGGCCAGCCAGGCAACCTTCTAGGTAACGACCACATCTACAACGTTATCGTCACAGCCCATGCAT +TTGTAATAATCTTCTTCATAGTAATACCCATCATAATCGGAGGCTTTGGCAACTGACTAGTTCCCCTAAT +AATCGGTGCCCCCGATATGGCGTTTCCCCGCATAAACAACATAAGCTTCTGACTCTTACCTCCCTCTCTC +CTACTCCTGCTCGCATCTGCTATAGTGGAGGCCGGAGCAGGAACAGGTTGAACAGTCTACCCTCCCTTAG +CAGGGAACTACTCCCACCCTGGAGCCTCCGTAGACCTAACCATCTTCTCCTTACACCTAGCAGGTGTCTC 
+CTCTATCTTAGGGGCCATCAATTTCATCACAACAATTATCAATATAAAACCCCCTGCCATAACCCAATAC +CAAACGCCCCTCTTCGTCTGATCCGTCCTAATCACAGCAGTCCTACTTCTCCTATCTCTCCCAGTCCTAG +CTGCTGGCATCACTATACTACTAACAGACCGCAACCTCAACACCACCTTCTTCGACCCCGCCGGAGGAGG +AGACCCCATTCTATACCAACACCTATTCTGATTTTTCGGTCACCCTGAAGTTTATATTCTTATCCTACCA +GGCTTCGGAATAATCTCCCATATTGTAACTTACTACTCCGGAAAAAAAGAACCATTTGGATACATAGGTA +TGGTCTGAGCTATGATATCAATTGGCTTCCTAGGGTTTATCGTGTGAGCACACCATATATTTACAGTAGG +AATAGACGTAGACACACGAGCATATTTCACCTCCGCTACCATAATCATCGCTATCCCCACCGGCGTCAAA +GTATTTAGCTGACTCGCCACACTCCACGGAAGCAATATGAAATGATCTGCTGCAGTGCTCTGAGCCCTAG +GATTCATCTTTCTTTTCACCGTAGGTGGCCTGACTGGCATTGTATTAGCAAACTCATCACTAGACATCGT +ACTACACGACACGTACTACGTTGTAGCCCACTTCCACTATGTCCTATCAATAGGAGCTGTATTTGCCATC +ATAGGAGGCTTCATTCACTGATTTCCCCTATTCTCAGGCTACACCCTAGACCAAACCTACGCCAAAATCC +ATTTCACTATCATATTCATCGGCGTAAATCTAACTTTCTTCCCACAACACTTTCTCGGCCTATCCGGAAT +GCCCCGACGTTACTCGGACTACCCCGATGCATACACCACATGAAACATCCTATCATCTGTAGGCTCATTC +ATTTCTCTAACAGCAGTAATATTAATAATTTTCATGATTTGAGAAGCCTTCGCTTCGAAGCGAAAAGTCC +TAATAGTAGAAGAACCCTCCATAAACCTGGAGTGACTATATGGATGCCCCCCACCCTACCACACATTCGA +AGAACCCGTATACATAAAATCTAGACAAAAAAGGAAGGAATCGAACCCCCCAAAGCTGGTTTCAAGCCAA +CCCCATGGCCTCCATGACTTTTTCAAAAAGGTATTAGAAAAACCATTTCATAACTTTGTCAAAGTTAAAT +TATAGGCTAAATCCTATATATCTTAATGGCACATGCAGCGCAAGTAGGTCTACAAGACGCTACTTCCCCT +ATCATAGAAGAGCTTATCACCTTTCATGATCACGCCCTCATAATCATTTTCCTTATCTGCTTCCTAGTCC +TGTATGCCCTTTTCCTAACACTCACAACAAAACTAACTAATACTAACATCTCAGACGCTCAGGAAATAGA +AACCGTCTGAACTATCCTGCCCGCCATCATCCTAGTCCTCATCGCCCTCCCATCCCTACGCATCCTTTAC +ATAACAGACGAGGTCAACGATCCCTCCCTTACCATCAAATCAATTGGCCACCAATGGTACTGAACCTACG +AGTACACCGACTACGGCGGACTAATCTTCAACTCCTACATACTTCCCCCATTATTCCTAGAACCAGGCGA +CCTGCGACTCCTTGACGTTGACAATCGAGTAGTACTCCCGATTGAAGCCCCCATTCGTATAATAATTACA +TCACAAGACGTCTTGCACTCATGAGCTGTCCCCACATTAGGCTTAAAAACAGATGCAATTCCCGGACGTC +TAAACCAAACCACTTTCACCGCTACACGACCGGGGGTATACTACGGTCAATGCTCTGAAATCTGTGGAGC +AAACCACAGTTTCATGCCCATCGTCCTAGAATTAATTCCCCTAAAAATCTTTGAAATAGGGCCCGTATTT 
+ACCCTATAGCACCCCCTCTACCCCCTCTAGAGCCCACTGTAAAGCTAACTTAGCATTAACCTTTTAAGTT +AAAGATTAAGAGAACCAACACCTCTTTACAGTGAAATGCCCCAACTAAATACTACCGTATGGCCCACCAT +AATTACCCCCATACTCCTTACACTATTCCTCATCACCCAACTAAAAATATTAAACACAAACTACCACCTA +CCTCCCTCACCAAAGCCCATAAAAATAAAAAATTATAACAAACCCTGAGAACCAAAATGAACGAAAATCT +GTTCGCTTCATTCATTGCCCCCACAATCCTAGGCCTACCCGCCGCAGTACTGATCATTCTATTTCCCCCT +CTATTGATCCCCACCTCCAAATATCTCATCAACAACCGACTAATCACCACCCAACAATGACTAATCAAAC +TAACCTCAAAACAAATGATAACCATACACAACACTAAAGGACGAACCTGATCTCTTATACTAGTATCCTT +AATCATTTTTATTGCCACAACTAACCTCCTCGGACTCCTGCCTCACTCATTTACACCAACCACCCAACTA +TCTATAAACCTAGCCATGGCCATCCCCTTATGAGCGGGCACAGTGATTATAGGCTTTCGCTCTAAGATTA +AAAATGCCCTAGCCCACTTCTTACCACAAGGCACACCTACACCCCTTATCCCCATACTAGTTATTATCGA +AACCATCAGCCTACTCATTCAACCAATAGCCCTGGCCGTACGCCTAACCGCTAACATTACTGCAGGCCAC +CTACTCATGCACCTAATTGGAAGCGCCACCCTAGCAATATCAACCATTAACCTTCCCTCTACACTTATCA +TCTTCACAATTCTAATTCTACTGACTATCCTAGAAATCGCTGTCGCCTTAATCCAAGCCTACGTTTTCAC +ACTTCTAGTAAGCCTCTACCTGCACGACAACACATAATGACCCACCAATCACATGCCTATCATATAGTAA +AACCCAGCCCATGACCCCTAACAGGGGCCCTCTCAGCCCTCCTAATGACCTCCGGCCTAGCCATGTGATT +TCACTTCCACTCCATAACGCTCCTCATACTAGGCCTACTAACCAACACACTAACCATATACCAATGATGG +CGCGATGTAACACGAGAAAGCACATACCAAGGCCACCACACACCACCTGTCCAAAAAGGCCTTCGATACG +GGATAATCCTATTTATTACCTCAGAAGTTTTTTTCTTCGCAGGATTTTTCTGAGCCTTTTACCACTCCAG +CCTAGCCCCTACCCCCCAATTAGGAGGGCACTGGCCCCCAACAGGCATCACCCCGCTAAATCCCCTAGAA +GTCCCACTCCTAAACACATCCGTATTACTCGCATCAGGAGTATCAATCACCTGAGCTCACCATAGTCTAA +TAGAAAACAACCGAAACCAAATAATTCAAGCACTGCTTATTACAATTTTACTGGGTCTCTATTTTACCCT +CCTACAAGCCTCAGAGTACTTCGAGTCTCCCTTCACCATTTCCGACGGCATCTACGGCTCAACATTTTTT +GTAGCCACAGGCTTCCACGGACTTCACGTCATTATTGGCTCAACTTTCCTCACTATCTGCTTCATCCGCC +AACTAATATTTCACTTTACATCCAAACATCACTTTGGCTTCGAAGCCGCCGCCTGATACTGGCATTTTGT +AGATGTGGTTTGACTATTTCTGTATGTCTCCATCTATTGATGAGGGTCTTACTCTTTTAGTATAAATAGT +ACCGTTAACTTCCAATTAACTAGTTTTGACAACATTCAAAAAAGAGTAATAAACTTCGCCTTAATTTTAA +TAATCAACACCCTCCTAGCCTTACTACTAATAATTATTACATTTTGACTACCACAACTCAACGGCTACAT 
+AGAAAAATCCACCCCTTACGAGTGCGGCTTCGACCCTATATCCCCCGCCCGCGTCCCTTTCTCCATAAAA +TTCTTCTTAGTAGCTATTACCTTCTTATTATTTGATCTAGAAATTGCCCTCCTTTTACCCCTACCATGAG +CCCTACAAACAACTAACCTGCCACTAATAGTTATGTCATCCCTCTTATTAATCATCATCCTAGCCCTAAG +TCTGGCCTATGAGTGACTACAAAAAGGATTAGACTGAACCGAATTGGTATATAGTTTAAACAAAACGAAT +GATTTCGACTCATTAAATTATGATAATCATATTTACCAAATGCCCCTCATTTACATAAATATTATACTAG +CATTTACCATCTCACTTCTAGGAATACTAGTATATCGCTCACACCTCATATCCTCCCTACTATGCCTAGA +AGGAATAATACTATCGCTGTTCATTATAGCTACTCTCATAACCCTCAACACCCACTCCCTCTTAGCCAAT +ATTGTGCCTATTGCCATACTAGTCTTTGCCGCCTGCGAAGCAGCGGTGGGCCTAGCCCTACTAGTCTCAA +TCTCCAACACATATGGCCTAGACTACGTACATAACCTAAACCTACTCCAATGCTAAAACTAATCGTCCCA +ACAATTATATTACTACCACTGACATGACTTTCCAAAAAACACATAATTTGAATCAACACAACCACCCACA +GCCTAATTATTAGCATCATCCCTCTACTATTTTTTAACCAAATCAACAACAACCTATTTAGCTGTTCCCC +AACCTTTTCCTCCGACCCCCTAACAACCCCCCTCCTAATACTAACTACCTGACTCCTACCCCTCACAATC +ATGGCAAGCCAACGCCACTTATCCAGTGAACCACTATCACGAAAAAAACTCTACCTCTCTATACTAATCT +CCCTACAAATCTCCTTAATTATAACATTCACAGCCACAGAACTAATCATATTTTATATCTTCTTCGAAAC +CACACTTATCCCCACCTTGGCTATCATCACCCGATGAGGCAACCAGCCAGAACGCCTGAACGCAGGCACA +TACTTCCTATTCTACACCCTAGTAGGCTCCCTTCCCCTACTCATCGCACTAATTTACACTCACAACACCC +TAGGCTCACTAAACATTCTACTACTCACTCTCACTGCCCAAGAACTATCAAACTCCTGAGCCAACAACTT +AATATGACTAGCTTACACAATAGCTTTTATAGTAAAGATACCTCTTTACGGACTCCACTTATGACTCCCT +AAAGCCCATGTCGAAGCCCCCATCGCTGGGTCAATAGTACTTGCCGCAGTACTCTTAAAACTAGGCGGCT +ATGGTATAATACGCCTCACACTCATTCTCAACCCCCTGACAAAACACATAGCCTACCCCTTCCTTGTACT +ATCCCTATGAGGCATAATTATAACAAGCTCCATCTGCCTACGACAAACAGACCTAAAATCGCTCATTGCA +TACTCTTCAATCAGCCACATAGCCCTCGTAGTAACAGCCATTCTCATCCAAACCCCCTGAAGCTTCACCG +GCGCAGTCATTCTCATAATCGCCCACGGGCTTACATCCTCATTACTATTCTGCCTAGCAAACTCAAACTA +CGAACGCACTCACAGTCGCATCATAATCCTCTCTCAAGGACTTCAAACTCTACTCCCACTAATAGCTTTT +TGATGACTTCTAGCAAGCCTCGCTAACCTCGCCTTACCCCCCACTATTAACCTACTGGGAGAACTCTCTG +TGCTAGTAACCACGTTCTCCTGATCAAATATCACTCTCCTACTTACAGGACTCAACATACTAGTCACAGC +CCTATACTCCCTCTACATATTTACCACAACACAATGGGGCTCACTCACCCACCACATTAACAACATAAAA 
+CCCTCATTCACACGAGAAAACACCCTCATGTTCATACACCTATCCCCCATTCTCCTCCTATCCCTCAACC +CCGACATCATTACCGGGTTTTCCTCTTGTAAATATAGTTTAACCAAAACATCAGATTGTGAATCTGACAA +CAGAGGCTTACGACCCCTTATTTACCGAGAAAGCTCACAAGAACTGCTAACTCATGCCCCCATGTCTAAC +AACATGGCTTTCTCAACTTTTAAAGGATAACAGCTATCCATTGGTCTTAGGCCCCAAAAATTTTGGTGCA +ACTCCAAATAAAAGTAATAACCATGCACACTACTATAACCACCCTAACCCTGACTTCCCTAATTCCCCCC +ATCCTTACCACCCTCGTTAACCCTAACAAAAAAAACTCATACCCCCATTATGTAAAATCCATTGTCGCAT +CCACCTTTATTATCAGTCTCTTCCCCACAACAATATTCATGTGCCTAGACCAAGAAGTTATTATCTCGAA +CTGACACTGAGCCACAACCCAAACAACCCAGCTCTCCCTAAGCTTCAAACTAGACTACTTCTCCATAATA +TTCATCCCTGTAGCATTGTTCGTTACATGGTCCATCATAGAATTCTCACTGTGATATATAAACTCAGACC +CAAACATTAATCAGTTCTTCAAATATCTACTCATCTTCCTAATTACCATACTAATCTTAGTTACCGCTAA +CAACCTATTCCAACTGTTCATCGGCTGAGAGGGCGTAGGAATTATATCCTTCTTGCTCATCAGTTGATGA +TACGCCCGAGCAGATGCCAACACAGCAGCCATTCAAGCAATCCTATACAACCGTATCGGCGATATCGGTT +TCATCCTCGCCTTAGCATGATTTATCCTACACTCCAACTCATGAGACCCACAACAAATAGCCCTTCTAAA +CGCTAATCCAAGCCTCACCCCACTACTAGGCCTCCTCCTAGCAGCAGCAGGCAAATCAGCCCAATTAGGT +CTCCACCCCTGACTCCCCTCAGCCATAGAAGGCCCCACCCCAGTCTCAGCCCTACTCCACTCAAGCACTA +TAGTTGTAGCAGGAATCTTCTTACTCATCCGCTTCCACCCCCTAGCAGAAAATAGCCCACTAATCCAAAC +TCTAACACTATGCTTAGGCGCTATCACCACTCTGTTCGCAGCAGTCTGCGCCCTTACACAAAATGACATC +AAAAAAATCGTAGCCTTCTCCACTTCAAGTCAACTAGGACTCATAATAGTTACAATCGGCATCAACCAAC +CACACCTAGCATTCCTGCACATCTGTACCCACGCCTTCTTCAAAGCCATACTATTTATGTGCTCCGGGTC +CATCATCCACAACCTTAACAATGAACAAGATATTCGAAAAATAGGAGGACTACTCAAAACCATACCTCTC +ACTTCAACCTCCCTCACCATTGGCAGCCTAGCATTAGCAGGAATACCTTTCCTCACAGGTTTCTACTCCA +AAGACCACATCATCGAAACCGCAAACATATCATACACAAACGCCTGAGCCCTATCTATTACTCTCATCGC +TACCTCCCTGACAAGCGCCTATAGCACTCGAATAATTCTTCTCACCCTAACAGGTCAACCTCGCTTCCCC +ACCCTTACTAACATTAACGAAAATAACCCCACCCTACTAAACCCCATTAAACGCCTGGCAGCCGGAAGCC +TATTCGCAGGATTTCTCATTACTAACAACATTTCCCCCGCATCCCCCTTCCAAACAACAATCCCCCTCTA +CCTAAAACTCACAGCCCTCGCTGTCACTTTCCTAGGACTTCTAACAGCCCTAGACCTCAACTACCTAACC +AACAAACTTAAAATAAAATCCCCACTATGCACATTTTATTTCTCCAACATACTCGGATTCTACCCTAGCA 
+TCACACACCGCACAATCCCCTATCTAGGCCTTCTTACGAGCCAAAACCTGCCCCTACTCCTCCTAGACCT +AACCTGACTAGAAAAGCTATTACCTAAAACAATTTCACAGCACCAAATCTCCACCTCCATCATCACCTCA +ACCCAAAAAGGCATAATTAAACTTTACTTCCTCTCTTTCTTCTTCCCACTCATCCTAACCCTACTCCTAA +TCACATAACCTATTCCCCCGAGCAATCTCAATTACAATATATACACCAACAAACAATGTTCAACCAGTAA +CTACTACTAATCAACGCCCATAATCATACAAAGCCCCCGCACCAATAGGATCCTCCCGAATCAACCCTGA +CCCCTCTCCTTCATAAATTATTCAGCTTCCTACACTATTAAAGTTTACCACAACCACCACCCCATCATAC +TCTTTCACCCACAGCACCAATCCTACCTCCATCGCTAACCCCACTAAAACACTCACCAAGACCTCAACCC +CTGACCCCCATGCCTCAGGATACTCCTCAATAGCCATCGCTGTAGTATATCCAAAGACAACCATCATTCC +CCCTAAATAAATTAAAAAAACTATTAAACCCATATAACCTCCCCCAAAATTCAGAATAATAACACACCCG +ACCACACCGCTAACAATCAATACTAAACCCCCATAAATAGGAGAAGGCTTAGAAGAAAACCCCACAAACC +CCATTACTAAACCCACACTCAACAGAAACAAAGCATACATCATTATTCTCGCACGGACTACAACCACGAC +CAATGATATGAAAAACCATCGTTGTATTTCAACTACAAGAACACCAATGACCCCAATACGCAAAACTAAC +CCCCTAATAAAATTAATTAACCACTCATTCATCGACCTCCCCACCCCATCCAACATCTCCGCATGATGAA +ACTTCGGCTCACTCCTTGGCGCCTGCCTGATCCTCCAAATCACCACAGGACTATTCCTAGCCATGCACTA +CTCACCAGACGCCTCAACCGCCTTTTCATCAATCGCCCACATCACTCGAGACGTAAATTATGGCTGAATC +ATCCGCTACCTTCACGCCAATGGCGCCTCAATATTCTTTATCTGCCTCTTCCTACACATCGGGCGAGGCC +TATATTACGGATCATTTCTCTACTCAGAAACCTGAAACATCGGCATTATCCTCCTGCTTGCAACTATAGC +AACAGCCTTCATAGGCTATGTCCTCCCGTGAGGCCAAATATCATTCTGAGGGGCCACAGTAATTACAAAC +TTACTATCCGCCATCCCATACATTGGGACAGACCTAGTTCAATGAATCTGAGGAGGCTACTCAGTAGACA +GTCCCACCCTCACACGATTCTTTACCTTTCACTTCATCTTGCCCTTCATTATTGCAGCCCTAGCAACACT +CCACCTCCTATTCTTGCACGAAACGGGATCAAACAACCCCCTAGGAATCACCTCCCATTCCGATAAAATC +ACCTTCCACCCTTACTACACAATCAAAGACGCCCTCGGCTTACTTCTCTTCCTTCTCTCCTTAATGACAT +TAACACTATTCTCACCAGACCTCCTAGGCGACCCAGACAATTATACCCTAGCCAACCCCTTAAACACCCC +TCCCCACATCAAGCCCGAATGATATTTCCTATTCGCCTACACAATTCTCCGATCCGTCCCTAACAAACTA +GGAGGCGTCCTTGCCCTATTACTATCCATCCTCATCCTAGCAATAATCCCCATCCTCCATATATCCAAAC +AACAAAGCATAATATTTCGCCCACTAAGCCAATCACTTTATTGACTCCTAGCCGCAGACCTCCTCATTCT +AACCTGAATCGGAGGACAACCAGTAAGCTACCCTTTTACCATCATTGGACAAGTAGCATCCGTACTATAC 
+TTCACAACAATCCTAATCCTAATACCAACTATCTCCCTAATTGAAAACAAAATACTCAAATGGGCCTGTC +CTTGTAGTATAAACTAATACACCAGTCTTGTAAACCGGAGATGAAAACCTTTTTCCAAGGACAAATCAGA +GAAAAAGTCTTTAACTCCACCATTAGCACCCAAAGCTAAGATTCTAATTTAAACTATTCTCTGTTCTTTC +ATGGGGAAGCAGATTTGGGTACCACCCAAGTATTGACTCACCCATCAACAACCGCTATGTATTTCGTACA +TTACTGCCAGCCACCATGAATATTGTACGGTACCATAAATACTTGACCACCTGTAGTACATAAAAACCCA +ATCCACATCAAAACCCCCTCCCCATGCTTACAAGCAAGTACAGCAATCAACCCTCAACTATCACACATCA +ACTGCAACTCCAAAGCCACCCCTCACCCACTAGGATACCAACAAACCTACCCACCCTTAACAGTACATAG +TACATAAAGCCATTTACCGTACATAGCACATTACAGTCAAATCCCTTCTCGTCCCCATGGATGACCCCCC +TCAGATAGGGGTCCCTTGACCACCATCCTCCGTGAAATCAATATCCCGCACAAGAGTGCTACTCTCCTCG +CTCCGGGCCCATAACACTTGGGGGTAGCTAAAGTGAACTGTATCCGACATCTGGTTCCTACTTCAGGGTC +ATAAAGCCTAAATAGCCCACACGTTCCCCTTAAATAAGACATCACGATG diff -r 000000000000 -r 7653ebd919bb test-data/meme_fimo_input_1.xml --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/meme_fimo_input_1.xml Mon Jul 14 21:33:08 2025 +0000 @@ -0,0 +1,8739 @@ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +]> + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + 
+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +0.294 +0.209 +0.164 +0.333 + + + + +meme meme_inputx.fa -o meme_outx -dna +ThinkPad-T450s +zoops +1 +inf +E-value of product of p-values +0 +8 +50 +11 +1 +yes +yes +2 +1000 +0.8 +uni +0.5 +dirichlet +0.01 +50 +1e-05 +1000 +80981 +0 +-1 +-1 +forward + +Stopped because requested number of motifs (1) found. 
+ + +0.294 +0.209 +0.164 +0.333 + + + + + + + + +-67 +-58 +-1545 +102 + + +173 +-1545 +-262 +-1545 + + +-1545 +189 +-1545 +-57 + + +-1545 +-1545 +-1545 +159 + + +177 +-1545 +-1545 +-1545 + + +177 +-1545 +-1545 +-1545 + + +-1545 +166 +-1545 +1 + + +83 +35 +-1545 +-67 + + + + + + +0.184855 +0.140312 +0.000000 +0.674833 + + +0.973274 +0.000000 +0.026726 +0.000000 + + +0.000000 +0.775056 +0.000000 +0.224944 + + +0.000000 +0.000000 +0.000000 +1.000000 + + +1.000000 +0.000000 +0.000000 +0.000000 + + +1.000000 +0.000000 +0.000000 +0.000000 + + +0.000000 +0.663697 +0.000000 +0.336303 + + +0.523385 +0.267261 +0.000000 +0.209354 + + + + +TA[CT]TAA[CT][ACT] + + + +TAC + + + + + + + + + + +ATATATTAGC + + +TGGCCTCATT + + + + + + + + + + +GATAAGTAGT + + +GTCTTTCATG + + + + + + + + + + +AGTTTTCAAA + + +TCTTGGCTTT + + + + + + + + + + +GTGATCAGTC + + +CCCCCTCATG + + + + + + + + + + +CTCTTGTAGG + + +GTGACTCAGA + + + + + + + + + + +GCAATGTAGC + + + + + + + + + + + + + +TTTTGTGTAG + + +TAAATCCTCC + + + + + + + + + + +AAAAGTCTAT + + +TATTAACAAT + + + + + + + + + + +TCTTAGAGCA + + +AAATATCCCT + + + + + + + + + + +CACTGGGGAA + + +AGACCACACA + + + + + + + + + + +GTCGTCTTCA + + +GTTAATGAAA + + + + + + + + + + +AACCAGTGGT + + +CTAATATAAA + + + + + + + + + + +ATAG + + +ATTTACCTTT + + + + + + + + + + +CGCTTATTTG + + +CTCTGTTGTG + + + + + + + + + + +AAAATAGTTG + + +TCCCCACCCT + + + + + + + + + + +TTAACGAAAA + + +AGGCAGGGCC + + + + + + + + + + +GGGACCCAAG + + +AACAAAATTT + + + + + + + + + + +CAAATACTAA + + +ATTTTCTTTC + + + + + + + + + + +CCATA + + +CCAATGCTAT + + + + + + + + + + +ATATGGTTAC + + +CAGTGAAATG + + + + + + + + + + +CTGCTGCCTT + + +TTT + + + + + + + + + + +ATTTACACAT + + +CATTTTCCAT + + + + + + + + + + +GCATCCTAAT + + +ATTGCTTTAT + + + + + + + + + + +CCTGGAACAG + + +ATGTATA + + + + + + + + + + +GAAATAAAAT + + +ACCATGTATA + + + + + + + + + + +GAAATAAAAT + + +CATTGAACAT + + + + + + + + + + +AGCCTGGGCT + + +AATTGTATGG + + + + + + + + + + +ACTAGAGTAC + + +TTGGGACTGT + + + + + + + + + + 
+GTGCTGTTTA + + +CACT + + + + + + + + + + +ATATTTATTG + + +TCCTACTGAC + + + + + + + + + + +AATATAAAAT + + +TTGTGA + + + + + + + + + + +GCTGCCAGCA + + +AGACCACACA + + + + + + + + + + +GTCGTCTTCA + + +TGTCGGTATA + + + + + + + + + + +GTTTAATATT + + +ATGACCCATT + + + + + + + + + + +GGCAACAAGC + + +AACC + + + + + + + + + + +TGGATTGGTT + + + + + + + + + + + + + +TTTGTATTAA + + +ATTTAATACT + + + + + + + + + + +ACAGAGATAC + + +GTTGTCTCCT + + + + + + + + + + +ATATTCTGCC + + +AAAAAAATAT + + + + + + + + + + +TGTCTTTTGC + + +AATAGAAAAT + + + + + + + + + + +ATATCTAACA + + +ATGTGAAAGT + + + + + + + + + + +TTTATTATGT + + +CAATAGTGCT + + + + + + + + + + +CTTGACAGTA + + +ACCCCATCTC + + + + + + + + + + +TGGAGAAACC + + +AACTAACTAA + + + + + + + + + + +TCTCAGACGC + + +TAAA + + + + + + + + + + +TTGTATCCAT + + +AGTGGTTATA + + + + + + + + + + +TTGTTTGATG + + +TTTCACCTAT + + + + + + + + + + +TTATTATGGC + + +ATTACACCAT + + + + + + + + + + +CTCAAACACA + + +GAAGAGAATA + + + + + + + + + + +TGGGAAAAAG + + +TTTACATTTT + + + + + + + + + + +TTTGCGTTGT + + +TAGTACTTAT + + + + + + + + + + +GTAGTTATTT + + +AAAATCACTG + + + + + + + + + + +AGATTTGAAA + + +TGAAACCCAA + + + + + + + + + + +TAATTATAGT + + +CTACAATGTC + + + + + + + + + + +TGTCCTAGCC + + +TTAG + + + + + + + + + + +ACAATCCTTT + + +CTGCTGGTAT + + + + + + + + + + +TAGTTTACTC + + + + + + + + + + + + + +ATAACGGATT + + +CATTTTAAAG + + + + + + + + + + +TTTGGCCACA + + +CCCAAATTA + + + + + + + + + + +GCTCATAATT + + +TCATTTAACA + + + + + + + + + + +TCTGTAATTG + + +C + + + + + + + + + + +TCCTTTCTCT + + +TAGCTCTCTA + + + + + + + + + + +CGTGTTACAA + + +ATTTACATAT + + + + + + + + + + +AAACTTAAAC + + +GC + + + + + + + + + + +CAAGTCTAGT + + +AACCACTAAC + + + + + + + + + + +TACTTCTTGC + + +TCAGTACTCT + + + + + + + + + + +ACCTGGTGCA + + +ACAACAACAT + + + + + + + + + + +TGTGGAGTCA + + +ATACTAGGCC + + + + + + + + + + +AACACACTAA + + +ATTC + + + + + + + + + + +TTTAAGGTGA + + +CATATGTGTA + + + + + + + + + + +ATACTCATCT + + +GCAATTGC + + + + + + + + + + 
+TATGATTAGA + + +TGTTGTTCAT + + + + + + + + + + +AACATCCCTT + + +ATGGCTTCCT + + + + + + + + + + +ATCCTTACTA + + +ACTCACATTC + + + + + + + + + + +CCATC + + +TCCCCTTGCT + + + + + + + + + + +CCTATTTAGA + + +GCAGTAGCAG + + + + + + + + + + +AGTCCAGTTG + + +GGGGTAACGA + + + + + + + + + + +AGTTCACCTA + + +AGTGG + + + + + + + + + + +AGTCCAGTTG + + +CTTAGTTTTC + + + + + + + + + + +AAAGAAAGAC + + +AGGAAAGTGT + + + + + + + + + + +TCTTGCACCC + + +GAATACTTTT + + + + + + + + + + +TCAGAGTCAA + + +AACTAAGCTA + + + + + + + + + + +CTAGGGTTCG + + +TAAAGTCAGC + + + + + + + + + + +TGGTACTATG + + +GCACTAGCCA + + + + + + + + + + +AGTCCAGTTG + + +GCACTAGCAG + + + + + + + + + + +AATCCAGTTG + + +ATATTCTGGA + + + + + + + + + + +CCCTTATCAG + + +GCCTAGCACC + + + + + + + + + + +CTGAGAAAAT + + +GACTTCTCAC + + + + + + + + + + +CTGGAAACTT + + +GTTTCTTTAA + + + + + + + + + + +AGAATACCAT + + +TGATGACCTT + + + + + + + + + + +AAAACATACT + + +ACAACTATAA + + + + + + + + + + +CTTTTCTCAG + + +GTAAAGGGAT + + + + + + + + + + +TTAGCTCAGA + + +TACACATGTT + + + + + + + + + + +ATAGTAGTGA + + +TTCTGAGATG + + + + + + + + + + +TCTGCCAGAC + + +AGTAATT + + + + + + + + + + +CCCACTGTGG + + +CCTGGGGATA + + + + + + + + + + +AACTGAGTCT + + +TTAAACAGAC + + + + + + + + + + +ATAAGGGTAC + + +CCCCTCCTAA + + + + + + + + + + +ACCTGACTCC + + +GTGTGAAGAT + + + + + + + + + + +TCCAACACTC + + +CCCCCAACTC + + + + + + + + + + +TTCAGTCCTA + + +TTTGGGCACA + + + + + + + + + + +TACTAACTGT + + +ATATCACCCA + + + + + + + + + + +AAATTATGTC + + +TTTGGTATGT + + + + + + + + + + +GTTAAACAAA + + +CCCCCACACA + + + + + + + + + + +AACATGACAG + + +GGCT + + + + + + + + + + +ACAGCTTTTG + + +TACTGTGCTG + + + + + + + + + + +CCCAATGGTA + + +CCTTTCACCC + + + + + + + + + + +AATCTCCCTG + + +GTGCCCATC + + + + + + + + + + +TTGCTGGACT + + +TACCCAATAT + + + + + + + + + + +CCCTATCCCC + + +TTGTAAGTAG + + + + + + + + + + +TATACATTAT + + +GCTCAAATTG + + + + + + + + + + +TTGGCTAGTG + + +CATGAGGTTT + + + + + + + + + + +CAAAATATGT + + +TTGAGCTGCA + + + + + + + + + + 
+GTGGTGGGGT + + +TTCATCT + + + + + + + + + + +TCTAAAGTAT + + +CTATCTCACT + + + + + + + + + + +ACTATGGACA + + +TATGCTTCTT + + + + + + + + + + +GCATTTATGC + + +TTGTAA + + + + + + + + + + +TAATAGTGGG + + +AAG + + + + + + + + + + +TGGCTAGTAT + + +TTTACATTCT + + + + + + + + + + +GAGTATAAGC + + +AATGA + + + + + + + + + + +ATACACATAA + + +TTATGTTTAT + + + + + + + + + + +TTGTGAACAA + + +AAAATAATCT + + + + + + + + + + +TGATATTAGA + + +GAACT + + + + + + + + + + +TGCTAATAAG + + +ATTACTTATA + + + + + + + + + + +ACATAATGAC + + +GT + + + + + + + + + + +AAGCACATTG + + +AATTAATTTC + + + + + + + + + + +CAGATATTTA + + +ACCACTGGTT + + + + + + + + + + +GGGACCTTGT + + +AGAT + + + + + + + + + + +ACTTAGATTT + + +CTCAAATACT + + + + + + + + + + +ATAAAAGGGA + + +GTTAAAATTT + + + + + + + + + + +CACTTATCAG + + +TTCTTTCTCC + + + + + + + + + + +TTCCATCTGG + + +TGCTGATAAA + + + + + + + + + + +TTGTAACCCT + + +AGAATTAAAT + + + + + + + + + + +TAGGACTTCC + + +CTTGCTTTTT + + + + + + + + + + +ATGCGTCTCA + + +TAGAACTTT + + + + + + + + + + +CGTAGTCTTA + + +CATTC + + + + + + + + + + +TTTATTGGAC + + +CTGCTTAGCT + + + + + + + + + + +TCAGCTATTC + + +ACTGCTTAGT + + + + + + + + + + +CTTTTCATAT + + +TCAGTTATAC + + + + + + + + + + +TCTGCAGCCA + + +ATATTGTAAG + + + + + + + + + + +AAAT + + +ATGGCTTCA + + + + + + + + + + +TACATAGCCT + + +TAAATGTTTG + + + + + + + + + + +GACTTTAATT + + +CCCTTTAAGT + + + + + + + + + + +CCTAGAAATA + + +CTATATTTCA + + + + + + + + + + +CTTAGTGGAT + + +TTGTGAATAA + + + + + + + + + + +GTACTAATAA + + +ATTTGAAAGT + + + + + + + + + + +AACATCATAG + + +CCT + + + + + + + + + + +AAACTCTTAG + + +AAAAAGAAAT + + + + + + + + + + +TGTCAACCTT + + +CTCAGAAACA + + + + + + + + + + +GCACACGTTA + + +TGTGA + + + + + + + + + + +ATAGTTAACA + + +GTACATCCCA + + + + + + + + + + +ACTGACATAT + + +CTATTACA + + + + + + + + + + +TTCGTATCAG + + +GTGTTTTTTA + + + + + + + + + + +TCTATTATAA + + +C + + + + + + + + + + +TATGTTTTGA + + +TGATGTTTGA + + + + + + + + + + +TGAGCCCTGT + + +GAATAACAGC + + + + + + + + + + 
+TTTGAATAGC + + +AAACAAACCT + + + + + + + + + + +GCTAACCTGG + + +TAATGATAT + + + + + + + + + + +TTTGAGAGTG + + +TCACAT + + + + + + + + + + +TTTGTCCTTG + + +AAGAGTAAT + + + + + + + + + + +TTTCCCTTTT + + +ATTTTTCCAT + + + + + + + + + + +CTCTCTGTGT + + +ATAACTAAGA + + + + + + + + + + +ATGGGCTTGC + + +GCCATATGTG + + + + + + + + + + +ACTTGGAAGT + + +CTCCATTTTC + + + + + + + + + + +CTATACTGCT + + +TTTATATG + + + + + + + + + + +TTTGTTTAGG + + +ACTCTCCTAC + + + + + + + + + + +GTAAGCAATT + + +ACTAAGCTA + + + + + + + + + + +GTTAGGGTTG + + +TACCA + + + + + + + + + + +TTCAGTATCC + + +GCAAGAAGTA + + + + + + + + + + +CTTCGTCACT + + +TGAT + + + + + + + + + + +TGGTCAGGGG + + +AAAAACAAAA + + + + + + + + + + +TTTCAGCTTC + + +TT + + + + + + + + + + +ATCAAGAGTT + + +TTTAATC + + + + + + + + + + +AGGAAATTAA + + +TTTATAA + + + + + + + + + + +TTGGATGCAC + + +CTCTCTGGGT + + + + + + + + + + +TTTGAACTGA + + +TTCAT + + + + + + + + + + +TCTTAAAACT + + +TTTTTAGTAT + + + + + + + + + + +CTAGCCTGTA + + +TACTTTAATC + + + + + + + + + + +AGCAATAATA + + +GTTCGATGAC + + + + + + + + + + +GTTATAGCCA + + +TCAAACAAAA + + + + + + + + + + +TTGCGTGATT + + +GGGAGGTGAT + + + + + + + + + + +ATTCCATGCA + + +TGATAGATAA + + + + + + + + + + +CCATCGGCCT + + +CTGCTCTGCC + + + + + + + + + + +ACTCTTAAAA + + +CAAAGAAAA + + + + + + + + + + +ATACAAGCAC + + +AATCAGGT + + + + + + + + + + +TATTTAACTG + + +AAA + + + + + + + + + + +ATAACAATTA + + +ACAGTAGAGA + + + + + + + + + + +TACCTCATGT + + +CTCTATAGCT + + + + + + + + + + +TTTTCACACT + + +GACGCAGAAC + + + + + + + + + + +TTCCCATCTT + + +TTCTATGTGG + + + + + + + + + + +ATCTTCCTTC + + +CAAGTTAACG + + + + + + + + + + +AAATACATAA + + +GTCAGA + + + + + + + + + + +AAAATTACTT + + +CTGCTACCTC + + + + + + + + + + +CGTGAATGTT + + +TAATTGAAT + + + + + + + + + + +TAGTTGGTAT + + +TTTAACCAAA + + + + + + + + + + +TCTTTCTCTC + + +GTTCAGTTGT + + + + + + + + + + +TATTTTCAGC + + +AGTACTAAAA + + + + + + + + + + +CTGTAAGTCT + + +CTACTAC + + + + + + + + + + +ATAATAATAA + + +TGTTGACCAG + + + + + + 
+ + + + +CCAGGAGTTC + + +ATGATCA + + + + + + + + + + +ATTTAATATT + + +TTTTGTCTGA + + + + + + + + + + +TTACTACAGC + + +CCATTGGAGA + + + + + + + + + + +ATGTTCCAAT + + +ATTTTGTCAT + + + + + + + + + + +ATTCTAACCA + + +TGAACT + + + + + + + + + + +TTCTGTTATG + + +ACACCTACTG + + + + + + + + + + +AGTTAACCAC + + +AAGAAATAGC + + + + + + + + + + +TTGATACCTT + + +AA + + + + + + + + + + +CTGGTTTAAA + + +AAAGCAAATA + + + + + + + + + + +CAGGGTTAAG + + +GTC + + + + + + + + + + +GAGATCTAAC + + +CCCATGCCAG + + + + + + + + + + +TCACCTCAAT + + +TAAAGTACCC + + + + + + + + + + +TTCCACCTGA + + +TAAGCCCCAT + + + + + + + + + + +TTTATATGGC + + +TGGTTTAACT + + + + + + + + + + +TTTAGCTTGG + + +GCAGGTCACC + + + + + + + + + + +AAACAACTGA + + +AAATATT + + + + + + + + + + +TTTAGTTTGA + + +TTCAACTTTT + + + + + + + + + + +GTTGTATCAA + + +AATTCATGGT + + + + + + + + + + +TGAACTGGAA + + +AAATGCCACC + + + + + + + + + + +GTGATCCAGC + + +GAGAGTACGT + + + + + + + + + + +TTCAGATTGG + + +TGCTGCAGTT + + + + + + + + + + +CAACCTA + + +CTCTC + + + + + + + + + + +TTTTTTCTGA + + +ATGAGTTTAA + + + + + + + + + + +CTTTCAGGTT + + +AGACATTCAA + + + + + + + + + + +TTGCTGGAAG + + +CATAGAACTA + + + + + + + + + + +TTCTCACAAA + + + + + + + + + + + + + +TTCTAATTAC + + +AATAACCATC + + + + + + + + + + +TACTTATAAT + + +GTCCCCTTCT + + + + + + + + + + +AAATTGTGTA + + +AA + + + + + + + + + + +AAGTAGAATA + + +ATTTAACCCC + + + + + + + + + + +CTCTACTTGA + + +TAATAATAAT + + + + + + + + + + +CTTACGTAGC + + +ATAGTCTCCT + + + + + + + + + + +TTCTGTCCAC + + +ATATTCAGAG + + + + + + + + + + +CAGATAAAAA + + +AACTAAAACA + + + + + + + + + + +CCAGCCTGAG + + +CTGTTTTCCT + + + + + + + + + + +TTTTTTTAAA + + +TTGTGATAGG + + + + + + + + + + +TTCCGTAGCT + + +GATAAAATGA + + + + + + + + + + +CCAATGCAGG + + +ATACATTTTC + + + + + + + + + + +TTTTTCCATC + + +AGTGTAATAC + + + + + + + + + + +CATTTCCTTT + + +CATCAGTGTA + + + + + + + + + + +CATTATCCTG + + +CTAACT + + + + + + + + + + +AAGAGTAGAG + + +AAGTTTTAGA + + + + + + + + + + +ACCAGTCCTC + + +TTCCCTACTC + 
+ + + + + + + + + +ACTGGTATAA + + +AAAAAATCTT + + + + + + + + + + +TCCGGGTGAA + + +ATTTTCTTAC + + + + + + + + + + +ACCATCATCC + + +TTTCTAAAAG + + + + + + + + + + +TGACCTGATA + + +AATCCTGTTG + + + + + + + + + + +TCTCTGTCTC + + +T + + + + + + + + + + +TTTTCTTCTG + + +TAAATGTAAA + + + + + + + + + + +TATG + + +CCCCTAT + + + + + + + + + + +TATTACATTT + + +AATCAGGCAG + + + + + + + + + + +GTTTCTCTTT + + +GGAAGTGATC + + + + + + + + + + +TTCCTTTATA + + +TATA + + + + + + + + + + +TAAGTATTTT + + +TTTCCATACA + + + + + + + + + + +CTTTCAGTTC + + +TCAACTATTT + + + + + + + + + + +GCTGTTTACA + + +GTATTCTGTG + + + + + + + + + + +TTTATTGAGG + + +ATTAACATTT + + + + + + + + + + +TTATATGGAT + + +TTT + + + + + + + + + + +TCACCTGATT + + +CTTTAAGAAA + + + + + + + + + + +TTAAGCTTTT + + +CAATTAAGTT + + + + + + + + + + +TGTTGCCATA + + +TCCTGTTA + + + + + + + + + + +ACTAAGATAC + + +T + + + + + + + + + + +GATCTAAGTA + + +AATTACCTAA + + + + + + + + + + +AATCTTAAGC + + + + + + + + + + + + + +CTATTACCAT + + +TT + + + + + + + + + + +TTTTTCGTGT + + +TGCCCCCACA + + + + + + + + + + +CAGTTTCTGT + + +AATTAATCTT + + + + + + + + + + +ACAGTACCGC + + +GATAGATAAG + + + + + + + + + + +CCTCCAGGTC + + +CCTAAAGATC + + + + + + + + + + +ATGAATGGGT + + +ACT + + + + + + + + + + +TTTAGTTTGG + + +CAGAAGTATA + + + + + + + + + + +CAAACTCCCG + + +ACAACAGATC + + + + + + + + + + +ATTTCCTTAC + + +ATTTATCAAA + + + + + + + + + + +AAGTACACTT + + + + + + + + + + + + + +GTATATTTTA + + +AT + + + + + + + + + + +ATTGCCAATA + + +CTG + + + + + + + + + + +ATTAATTCTC + + +TG + + + + + + + + + + +TCTTATATCT + + +AGGTGATAAA + + + + + + + + + + +GTTTGAAGAC + + +TCCAGTA + + + + + + + + + + +GCATCTGAAA + + +TTTTCCTTTG + + + + + + + + + + +ACTTGGCTGT + + +TAACTTAATG + + + + + + + + + + +TAATTTAGGG + + +TTTATTGAT + + + + + + + + + + +CTGTGCCAGA + + +TACTGGTT + + + + + + + + + + +TCAAGCAGTT + + +TAAATGTAAA + + + + + + + + + + +TATGCTTGCA + + +TAAGTAGTAT + + + + + + + + + + +CTATTTACAG + + +CAATATCAAC + + + + + + + + + + +TTCCCTCTAC + + 
+TCATACAGCT + + + + + + + + + + +TTTGTCTGTC + + +ATTGGCATGC + + + + + + + + + + +ACTGCTGTAG + + +ATGATTTACC + + + + + + + + + + +AACCTCTCTT + + +TAAGTTACAT + + + + + + + + + + +AAAAC + + +TTTGTCTGTT + + + + + + + + + + +TTTATATGTT + + +TCCAGTTACC + + + + + + + + + + +CAGGTCAAGA + + +TTCTGTTAGC + + + + + + + + + + +TGTTAACAGC + + +CTAACCATAA + + + + + + + + + + +CCAACTACAA + + +CTAACCATAA + + + + + + + + + + +CCAACTACAA + + +AGGTATCTAC + + + + + + + + + + +TTGGAATAGT + + +TTTCCATAGA + + + + + + + + + + +ACAAAAGATA + + +CTCTGAATCC + + + + + + + + + + +CAAGACATGG + + +CTGCTT + + + + + + + + + + +TTAAATTTTG + + +GCATGAAAAG + + + + + + + + + + +T + + +TAGATGCTAA + + + + + + + + + + +GGGGTTGATG + + +GGTTGCAGCC + + + + + + + + + + +TGATTGTACA + + +ACCTATAAAA + + + + + + + + + + +CTCAGGTGGG + + +ATTTTTTTCT + + + + + + + + + + +CTGTCACCCA + + +TCATACTCTC + + + + + + + + + + +ACTGAGTTTA + + +CTAACACAAC + + + + + + + + + + +TGTTGAAATA + + +ATAGTGGCCA + + + + + + + + + + +TGCATTCCTA + + +CTCTTTGCAG + + + + + + + + + + +TCTAATGTAG + + +TAGAGAAGGT + + + + + + + + + + +TTCCCGAAGT + + +CAGAT + + + + + + + + + + +TATTCCAAAG + + +ACT + + + + + + + + + + +TTCTGATCTT + + +TGCTGTTGTC + + + + + + + + + + +CTATCATCTG + + +TAAT + + + + + + + + + + +CATGCCCCAG + + +TAGAATTCTT + + + + + + + + + + +GTGCTTGGTT + + +TTTTCCTGAA + + + + + + + + + + +ATCTTCTCTC + + +GTGTACTAAG + + + + + + + + + + +CATCCCAAAA + + +TCTTGTTAAC + + + + + + + + + + +TATACAGCCA + + +AACTGAATGT + + + + + + + + + + +CCTCAATAAA + + +AACTTTAGCC + + + + + + + + + + +TTAGCATCCA + + +ACAACTG + + + + + + + + + + +CTATCATTTG + + + + + + + + + + + + + +AAATTCAGCT + + +TTTTCCAGCA + + + + + + + + + + +TTTAGGTCAC + + +TAAGC + + + + + + + + + + +CTCTGTCTCT + + +ATATTACAAA + + + + + + + + + + +AATATTCATA + + +CTCACAACAA + + + + + + + + + + +AATACTAGTA + + +TTT + + + + + + + + + + +TTTCTACTTG + + +GGGGTAATGT + + + + + + + + + + +ATGCAATGTC + + +GTTGAGGAAC + + + + + + + + + + +TAAGAAAAAT + + +CCATTACT + + + + + + + + + + +TTCAAAATAA + 
+ +AATGCCTGAT + + + + + + + + + + +TTAACAACAG + + +C + + + + + + + + + + +TAATATAGTG + + +TAAATCTTAA + + + + + + + + + + +CAAGTAAAAA + + +CACTGT + + + + + + + + + + +ATTGAACTTC + + +GTGACAGAGC + + + + + + + + + + +AACTAACTAA + + +TTTTAAATTG + + + + + + + + + + +GACATGTTTG + + +AACTAATTCC + + + + + + + + + + +CCTTAAGAGT + + + + + + + + + + + + + +TGTAACAATA + + +ACAAGGGAGG + + + + + + + + + + +ACACATGTGT + + +CCCCTCCCTG + + + + + + + + + + +TCTGCACTCT + + +ATTCTTTAAG + + + + + + + + + + +GAATGTACTG + + +TAACTTTCTC + + + + + + + + + + +TTCCCCTGCT + + +T + + + + + + + + + + +CAAATGCTAA + + +GAATTAATAA + + + + + + + + + + +TCTCGGGTGA + + +GATTTGCTT + + + + + + + + + + +ATTTGGCTTG + + +AATGGGCTAA + + + + + + + + + + +GCCACGAACC + + +TCTTTTATT + + + + + + + + + + +TACTGTAGAG + + +ATTTTTTCTT + + + + + + + + + + +CTTCACTTAA + + +GTTCATGGAA + + + + + + + + + + +TAATGTTAAC + + +TTTAAAAAAT + + + + + + + + + + +TTAGGGGAAA + + +TTAAAAAT + + + + + + + + + + +TAGGCAACTT + + +CAAATCGGGA + + + + + + + + + + +TTCTATAGGC + + +TTAATAAC + + + + + + + + + + +TTTATTGCAT + + +ATCCAATGCA + + + + + + + + + + +TAATCAGTCT + + +TATTAACTTC + + + + + + + + + + +TTTCTATAAC + + +GCCAACTTCA + + + + + + + + + + +ATACTGTATA + + +CTGGAAGTTA + + + + + + + + + + +TCGGCTGTAG + + +ACACCTAGAA + + + + + + + + + + +CTTCCTTAGT + + +CTTCTAAA + + + + + + + + + + +TTCCAGTGTT + + +TAATTGTGTA + + + + + + + + + + +AAGACCTGAG + + +ACTAAG + + + + + + + + + + +CTTTCATTGT + + +GCATTTCCCA + + + + + + + + + + +TTTAGCTCTC + + +CATGATAACC + + + + + + + + + + +CA + + +CCCAGAGTCC + + + + + + + + + + +ATTACCAGGG + + +CCTAAGAAAC + + + + + + + + + + +T + + +AGCTAACTTC + + + + + + + + + + +CATTATCCTT + + +TTTTCTAACC + + + + + + + + + + +ACGGTTCTGA + + +TAACAGTTAC + + + + + + + + + + +ATCCGGTAGA + + +TTTATAAGGG + + + + + + + + + + +CCATTCATGA + + +ATAGCAT + + + + + + + + + + +CATCCTTTAG + + +GTTGCATTCG + + + + + + + + + + +TATATGTAGT + + +TTACTTATAC + + + + + + + + + + +AAAAAGATTT + + +AGATAGATAG + + + + + + + + + + +TTTGTGAGAA + 
+ + + + + + + + + + + + +ACATAATATT + + +TAATGTACTC + + + + + + + + + + +AATTGT + + +AATATGTCAT + + + + + + + + + + +ATAGTCAACA + + +TTCTACTTCC + + + + + + + + + + +ACTGCTCTCT + + +CTTTATTAAT + + + + + + + + + + +ACTTAGTCTA + + +TATCTGTTAG + + + + + + + + + + +CTACTCCTAC + + +ACTTAGCAAG + + + + + + + + + + +TATAAAGAAG + + +TATACTTCTT + + + + + + + + + + +AA + + +AC + + + + + + + + + + +TTCTATTGTA + + +GTATTCATAG + + + + + + + + + + +TTTTCTGGTA + + +TAAATGTCTT + + + + + + + + + + +ATCTACCTCC + + +CTTGCCTTCT + + + + + + + + + + +CCCCATTCTT + + +ATTGAACGTA + + + + + + + + + + +TTGATGTGTG + + +ATTCAATTCT + + + + + + + + + + +ACTCTGTGTG + + +AATATATATA + + + + + + + + + + +ACTCTGTCAC + + +GGCTTTATCT + + + + + + + + + + +CAGTCCCCAC + + +CTTATCTACC + + + + + + + + + + +CTTGTTAGAG + + +TTAACTCCAC + + + + + + + + + + +TATTCTAATT + + +TATTTGAATG + + + + + + + + + + +ATGGCATGTA + + +TTTTACT + + + + + + + + + + +TGGACACTGG + + +TTTATAAAGT + + + + + + + + + + +TGATCAGGGA + + +CCCTAAACCT + + + + + + + + + + +ATGCCTCATG + + +TACATGAAAA + + + + + + + + + + +ACATAATATT + + +CTGTTTAAAA + + + + + + + + + + +CACATAAATT + + +ATCATTAATA + + + + + + + + + + +AGAAAAATTG + + +TATATGAAAT + + + + + + + + + + +AACTTTCAG + + +ACCCCTCTT + + + + + + + + + + +TACTTGCTTC + + +GGAGTATACA + + + + + + + + + + +CATGTAAAGT + + +TGCTCTAATA + + + + + + + + + + +CTTTACTTAT + + +ATTC + + + + + + + + + + +TGAAAGTAGA + + +CCTCACCACT + + + + + + + + + + +GTATCTCCTC + + +A + + + + + + + + + + +TTTGTTATTC + + +TGAATCGGAA + + + + + + + + + + +TTAACACAAA + + +TCCTCTTCTT + + + + + + + + + + +CCTGTGCCTT + + +GCCTTAATTT + + + + + + + + + + +TATGCTATCA + + +CCATTGTCTC + + + + + + + + + + +GGCAGTGTTG + + +GTTCATTTT + + + + + + + + + + +CTTTAGCTCT + + +TGAACTTTGC + + + + + + + + + + +ATTGTTGATT + + +AGACTTAAGG + + + + + + + + + + +AAGGAGCAGG + + +AA + + + + + + + + + + +ACACTAATTT + + +ATCTTTTTTC + + + + + + + + + + +TATAGTTATG + + +CTTCTCT + + + + + + + + + + +TATAACTTCT + + +CCTAGAGTAA + + + + + + + + + + +ATTCTGCCCA 
+ + +TTGAATCATA + + + + + + + + + + +ACAAATGGAT + + +TTTGTTTAGT + + + + + + + + + + +CCTCTAGCTC + + +CTCTCTTAAT + + + + + + + + + + +TTATAGATTA + + +TTTCTGACTA + + + + + + + + + + +GTGTATATAG + + +ATACATAAGT + + + + + + + + + + +CTTTCTTGTT + + +TACCATCAAT + + + + + + + + + + +CTCACATATT + + +GCTCTTAACC + + + + + + + + + + +TTTCTTCTTT + + +TTAATGTATC + + + + + + + + + + +ATTCCACTTC + + +TAGCTT + + + + + + + + + + +AGTACTGACT + + +TGGTTGTACC + + + + + + + + + + +AATCTCTTTT + + +AATGTTAACT + + + + + + + + + + +CGGGTTCTGT + + +CC + + + + + + + + + + +TTAGACTTTC + + +CTTCTAACCA + + + + + + + + + + +CAGAACCCTT + + +CAATTAAATT + + + + + + + + + + +CACTTATTAG + + +CTATT + + + + + + + + + + +TCTCTTCATT + + +CTTCC + + + + + + + + + + +TTAAAACAAA + + +TCATCCCTCT + + + + + + + + + + +ATCATCCTAG + + +GATATAATTT + + + + + + + + + + +ATAAGAACTT + + + + + + + + + + + + + +TTTTCTCTGT + + +TACTGTCTTG + + + + + + + + + + +TCTTCCTAAC + + +CCAACCCTAA + + + + + + + + + + +ATAACCCTAA + + +TTAAACCCCA + + + + + + + + + + +ATTGCTCTTG + + +TTTTCTTCT + + + + + + + + + + +CTCCCTTTTC + + +GCTGGCACTG + + + + + + + + + + +ACTTAACATG + + +ATAAACTTCC + + + + + + + + + + +TTCCCTAAAC + + +TACTATATGC + + + + + + + + + + +CTAACAGCTC + + +TCCCAGCCTC + + + + + + + + + + +AT + + +TGAAGGCAGT + + + + + + + + + + +CTATATGAAC + + +TAACCTTTAG + + + + + + + + + + +TAAACCTCCT + + +GCTTTCTTTT + + + + + + + + + + +TTGGAATGAT + + +CTTTT + + + + + + + + + + +ATTTTAAGCT + + +TAAATGTA + + + + + + + + + + +TTTTAAGGTC + + +CCAATTAATT + + + + + + + + + + +AATTTATTGG + + +GAACTAGTAG + + + + + + + + + + +CAGGGAGCTC + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + 
+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + diff -r 000000000000 -r 7653ebd919bb test-data/meme_input_1.fasta --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/meme_input_1.fasta Mon Jul 14 21:33:08 2025 +0000 @@ -0,0 +1,66 @@ 
+>chr21_19617074_19617124_+ +AAAAATTATTACTAGGGAGGGGGCCGGAACCTCGGGACGTGGGTATATAA +>chr21_26934381_26934431_+ +GCGCCTGGTCGGTTATGAGTCACAAGTGAGTTATAAAAGGGTCGCACGTT +>chr21_28217753_28217803_- +CAAAGGGGAGGAGTGGGGTGGGGGTGGGGGTTTCACTGGTCCACTATAAA +>chr21_31710037_31710087_- +AACACCCAGGTTTCTGAGTATATAATCGCCGCACCAAAGAATTTAATTTT +>chr21_31744582_31744632_- +CCCAGGTCTAAGAGCATATATAACTTGGAGTCCAGACTATGACATTCAAA +>chr21_31768316_31768366_+ +AACGTATATAAATGGTCCTGTCCAGATGTGGCATGCAAACTCAGAATCTT +>chr21_31914206_31914256_- +TGACACCCACTACTTAGAGTATAAAATCATTCTGAGAAGTTAGAGACACC +>chr21_31933633_31933683_- +TCAGAGTATATATAAATGTTCCTGTCCAGTCACAGTCACCAAACTGACCT +>chr21_31962741_31962791_- +ACATATAACTCAGGTTGGATAAAATAATTTGTACAAATCAGGAGAGTCAA +>chr21_31964683_31964733_+ +TCTGATTCACTGAGGCATATAAAAGGCCCTCTGCGGAGAAGTGTCCATAC +>chr21_31973364_31973414_+ +aaacttaaaactctataaacttaaaactCTAGAATCTGATCCTGCTATAC +>chr21_31992870_31992920_+ +CTCATACACTATTGAAGATGTATAAAATTTCATTTGCAGATGGTGACATT +>chr21_32185595_32185645_- +TCACCACCCACCAGAGCTGGGATATATAAAGAAGGTTCTGAGACTAGGAA +>chr21_32202076_32202126_- +TGCCCACCAGCTTGAGGTATAAAAAGCCCTGTACGGGAAGAGACCTTCAT +>chr21_32253899_32253949_- +AGCCCCACCCACCAGCAAGGATATATAAAAGCTCAGGAGTCTGGAGTGAC +>chr21_32410820_32410870_- +TCTACCCCACTAATCACTGAGGATGTATAAAAGTCCCAGGGAAGCTGGTG +>chr21_36411748_36411798_- +ATAGTTCTGTATAGTTTCAGTTGGCATCtaaaaattatataactttattt +>chr21_37838750_37838800_- +gatggttttataaggggcctcaccctcggctcagccctcattcttctcct +>chr21_45705687_45705737_+ +CCGGGGCGGAGCGGCCTTTGCTCTTTGCGTGGTCGCGGGGGTATAACAGC +>chr21_45971413_45971463_- +CAGGCCCTGGGCATATAAAAGCCCCAGCAGCCAACAGGctcacacacaca +>chr21_45978668_45978718_- +CAGAGGGGTATAAAGGTTCCGACCACTCAGAGGCCTGGCACGAtcactca +>chr21_45993530_45993580_+ +CCAAGGAGGAGTATAAAAGCCCCACAAACCCGAGCACCTCACTCACTCGC +>chr21_46020421_46020471_+ +GAGACATATAAAAGCCAACATCCCTGAGCACCTAACACACGGactcactc +>chr21_46031920_46031970_+ +GGAAAATACCCAGGGAGGGTATAAAACCTCAGCAGCCAGGGCACACAAAC +>chr21_46046964_46047014_+ +ACAAGGCCAGGAGGGGTATAAAAGCCTGAGAGCCCCAAGAACctcacaca 
+>chr21_46057197_46057247_+ +ATTGCTGAGTCTCCTGCTGGGAAAACACAGGCCCTGGGCATATAAAAGCC +>chr21_46086869_46086919_- +GACAGGTGTGCTTCTGTGCTGTGGGGATGCCTGGGCCCAGGTATAAAGGC +>chr21_46102103_46102153_- +AGGTGTGTGCTTCTGTGCTGTGGGGATGCCTGGGTCCAGGTATAAAGGCT +>chr21_47517957_47518007_+ +CCTGGCGGCGGGGCGGGTCAGGCCGGCGGGGCGGGGTATAAAGGGGGCGG +>chr21_47517957_47518007_+ +CCTGGCGGCGGGGCGGGTCAGGCCGGCGGGGCGGGGTATAAAGGGGGCGG +>chr21_47517957_47518007_+ +CCTGGCGGCGGGGCGGGTCAGGCCGGCGGGGCGGGGTATAAAGGGGGCGG +>chr21_47575506_47575556_- +TGAGAAGCCGGTGGGGAGGTGCTGCCGGTGAGCGTATAAAGGCCCTGGCG +>chr21_47575506_47575556_- +TGAGAAGCCGGTGGGGAGGTGCTGCCGGTGAGCGTATAAAGGCCCTGGCG diff -r 000000000000 -r 7653ebd919bb test-data/meme_input_m.fasta --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/meme_input_m.fasta Mon Jul 14 21:33:08 2025 +0000 @@ -0,0 +1,66 @@ +>chr21_19617074_19617124_+ +AAAAATTATTACTAGGGAGGGGGCCGGAACCTCGGGACGTGGGTATATAA +>chr21_26934381_26934431_+ +GCGCCTGGTCGGTTATGAGTCACAAGTGAGTTATAAAAGGGTCGCACGTT +>chr21_28217753_28217803_- +CAAAGGGGAGGAGTGGGGTGGGGGTGGGGGTTTCACTGGTmCACTATAAA +>chr21_31710037_31710087_- +AACACCCAGGTTTCTGAGTATATAATCGCCGCACCAAAGAATTTAATTTT +>chr21_31744582_31744632_- +CCmAGGTCTAAGAGCATATATAACTTGGAGTCCAGACTATGACATTCAAA +>chr21_31768316_31768366_+ +AACGTATATAAATGGTCCTGTCCAGATGTGGCATGCAAACTmAGAATCTT +>chr21_31914206_31914256_- +TGACACCCACTACTTAGAGTATAAAATCATTCTGAGAAGTTAGAGACACC +>chr21_31933633_31933683_- +TCAGAGTATATATAAATGTTCCTGTCCAGTCACAGTCACCAAACTGACCT +>chr21_31962741_31962791_- +ACATATAACTCAGGTTGGATAAAATAATTTGTACAAATCAGGAGAGTCAA +>chr21_31964683_31964733_+ +TCTGATTCACTGAGGCATATAAAAGGCCCTCTGCGGAGAAGTGTCCATAC +>chr21_31973364_31973414_+ +aaacttaaaactctataaacttaaaactCTAGAATCTGATCCTGCTATAC +>chr21_31992870_31992920_+ +CTCATACACTATTGAAGATGTATAAAATTTCATTTGCAGATGGTGACATT +>chr21_32185595_32185645_- +TCACCACCCACCAGAGCTGGGATATATAAAGAAGGTTCTGAGACTAGGAA +>chr21_32202076_32202126_- +TGCCCACCAGCTTGAGGTATAAAAAGCCCTGTACGGGAAGAGACCTTCAT +>chr21_32253899_32253949_- 
+AGCCCCACCCACCAGCAAGGATATATAAAAGCTCAGGAGTCTGGAGTGAC +>chr21_32410820_32410870_- +TCTACCCCACTAATCACTGAGGATGTATAAAAGTCCCAGGGAAGCTGGTG +>chr21_36411748_36411798_- +ATAGTTCTGTATAGTTTCAGTTGGCATCtaaaaattatataactttattt +>chr21_37838750_37838800_- +gatggttttataaggggcctcaccctcggctcagccctcattcttctcct +>chr21_45705687_45705737_+ +CCGGGGCGGAGCGGCCTTTGCTCTTTGCGTGGTCGCGGGGGTATAACAGC +>chr21_45971413_45971463_- +CAGGCCCTGGGCATATAAAAGCCCCAGCAGCCAACAGGctcacacacaca +>chr21_45978668_45978718_- +CAGAGGGGTATAAAGGTTCCGACCACTCAGAGGCCTGGCACGAtcactca +>chr21_45993530_45993580_+ +CCAAGGAGGAGTATAAAAGCCCCACAAACCCGAGCACCTCACTCACTCGC +>chr21_46020421_46020471_+ +GAGACATATAAAAGCCAACATCCCTGAGCACCTAACACACGGactcactc +>chr21_46031920_46031970_+ +GGAAAATACCCAGGGAGGGTATAAAACCTCAGCAGCCAGGGCACACAAAC +>chr21_46046964_46047014_+ +ACAAGGCCAGGAGGGGTATAAAAGCCTGAGAGCCCCAAGAACctcacaca +>chr21_46057197_46057247_+ +ATTGCTGAGTCTCCTGCTGGGAAAACACAGGCCCTGGGCATATAAAAGCC +>chr21_46086869_46086919_- +GACAGGTGTGCTTCTGTGCTGTGGGGATGCCTGGGCCCAGGTATAAAGGC +>chr21_46102103_46102153_- +AGGTGTGTGCTTCTGTGCTGTGGGGATGCCTGGGTCCAGGTATAAAGGCT +>chr21_47517957_47518007_+ +CCTGGCGGCGGGGCGGGTCAGGCCGGCGGGGCGGGGTATAAAGGGGGmGG +>chr21_47517957_47518007_+ +CCTGGCGGCGGGGCGGGTCAGGCCGGCGGGGCGGGGTATAAAGGGGGCGG +>chr21_47517957_47518007_+ +CCTGGCGGCGGGGCGGGTCAGGCCGGCGGGGCGGGGTATAAAGGGGGCGG +>chr21_47575506_47575556_- +TGAGAAGCCGGTGGGGAGGTGmTGCCGGTGAGCGTATAAAGGCCCTGGCG +>chr21_47575506_47575556_- +TGAGAAGCmGGTGGGGAGGTGCTGCCGGTGAGCGTATAAAGGCCCTGGCG diff -r 000000000000 -r 7653ebd919bb test-data/meme_output_custom.html --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/meme_output_custom.html Mon Jul 14 21:33:08 2025 +0000 @@ -0,0 +1,276 @@ + "options": { + "mod": "zoops", + "revcomp": false, + "nmotifs": 1, + "objfun": "E-value of product of p-values", + "spfun": "E-value of product of p-values", + "minw": 8, + "maxw": 50, + "minsites": 2, + "maxsites": 30, + "wnsites": 0.8, + "spmap": "uni", + "spfuzz": 0.5, + "searchsize": 1500, + 
"maxsize": 1000000, + "norand": "no", + "csites": 1000, + "hsfrac": 0, + "prior": "dirichlet", + "b": 0.01, + "maxiter": 50, + "distance": 0.001, + "wg": 11, + "ws": 1, + "noendgaps": false, + "substring": true, + "seed": 0, + "brief": 1000 + }, + "alphabet": { + "name": "DNA with covalent modifications", + "like": "dna", + "ncore": 16, + "symbols": [ + { + "symbol": "A", + "name": "Adenine", + "colour": "8510A8", + "complement": "T" + }, { + "symbol": "C", + "name": "Cytosine", + "colour": "A50026", + "complement": "G" + }, { + "symbol": "G", + "name": "Guanine", + "colour": "313695", + "complement": "C" + }, { + "symbol": "T", + "name": "Thymine", + "colour": "A89610", + "complement": "A" + }, { + "symbol": "a", + "name": "N6-methyladenine", + "colour": "8510A8", + "complement": "t" + }, { + "symbol": "c", + "name": "5-Carboxylcytosine", + "colour": "FEE090", + "complement": "4" + }, { + "symbol": "f", + "name": "5-Formylcytosine", + "colour": "FDAE61", + "complement": "3" + }, { + "symbol": "g", + "name": "modified_g", + "colour": "00897B", + "complement": "5" + }, { + "symbol": "h", + "name": "5-Hydroxymethylcytosine", + "colour": "F46D43", + "complement": "2" + }, { + "symbol": "m", + "name": "5-Methylcytosine", + "colour": "D73027", + "complement": "1" + }, { + "symbol": "t", + "name": "Thymine_lowercase", + "colour": "756BB1", + "complement": "a" + }, { + "symbol": "1", + "name": "Guanine:5-Methylcytosine", + "colour": "4575B4", + "complement": "m" + }, { + "symbol": "2", + "name": "Guanine:5-Hydroxymethylcytosine", + "colour": "74ADD1", + "complement": "h" + }, { + "symbol": "3", + "name": "Guanine:5-Formylcytosine", + "colour": "ABD9E9", + "complement": "f" + }, { + "symbol": "4", + "name": "Guanine:5-Carboxylcytosine", + "colour": "E0F3F8", + "complement": "c" + }, { + "symbol": "5", + "name": "cytosine_lowercase", + "colour": "53698A", + "complement": "g" + }, { + "symbol": "?", + "equals": "ACGTacfghmt12345" + } + ] + }, + "background": { + "source": 
"--sequences--", + "order": 0, + "freqs": [ + 0.263, 0.2, 0.249, 0.189, 0.0297, 0.027, 0.00066, 0.00726, + 0.00066, 0.00396, 0.0277, 0.00066, 0.00066, 0.00066, 0.00066, + 0.00066 + ] + }, + "sequence_db": { + "primary_source": "Galaxy_FASTA_Input", + "primary_count": 30, + "primary_positions": 1500, + "control_source": "--none--", + "control_count": 0, + "control_positions": 0, + "freqs": [ + 0.265, 0.201, 0.251, 0.19, 0.0293, 0.0267, 0, 0.00667, 0, 0.00333, + 0.0273, 0, 0, 0, 0, 0 + ], + "sequences": [ + { + "name": "chr21_19617074_19617124_+", + "length": 50, + "weight": 1.000000 + }, { + "name": "chr21_26934381_26934431_+", + "length": 50, + "weight": 1.000000 + }, { + "name": "chr21_28217753_28217803_-", + "length": 50, + "weight": 1.000000 + }, { + "name": "chr21_31710037_31710087_-", + "length": 50, + "weight": 1.000000 + }, { + "name": "chr21_31744582_31744632_-", + "length": 50, + "weight": 1.000000 + }, { + "name": "chr21_31768316_31768366_+", + "length": 50, + "weight": 1.000000 + }, { + "name": "chr21_31914206_31914256_-", + "length": 50, + "weight": 1.000000 + }, { + "name": "chr21_31933633_31933683_-", + "length": 50, + "weight": 1.000000 + }, { + "name": "chr21_31962741_31962791_-", + "length": 50, + "weight": 1.000000 + }, { + "name": "chr21_31964683_31964733_+", + "length": 50, + "weight": 1.000000 + }, { + "name": "chr21_31973364_31973414_+", + "length": 50, + "weight": 1.000000 + }, { + "name": "chr21_31992870_31992920_+", + "length": 50, + "weight": 1.000000 + }, { + "name": "chr21_32185595_32185645_-", + "length": 50, + "weight": 1.000000 + }, { + "name": "chr21_32202076_32202126_-", + "length": 50, + "weight": 1.000000 + }, { + "name": "chr21_32253899_32253949_-", + "length": 50, + "weight": 1.000000 + }, { + "name": "chr21_32410820_32410870_-", + "length": 50, + "weight": 1.000000 + }, { + "name": "chr21_36411748_36411798_-", + "length": 50, + "weight": 1.000000 + }, { + "name": "chr21_37838750_37838800_-", + "length": 50, + "weight": 1.000000 
+ }, { + "name": "chr21_45705687_45705737_+", + "length": 50, + "weight": 1.000000 + }, { + "name": "chr21_45971413_45971463_-", + "length": 50, + "weight": 1.000000 + }, { + "name": "chr21_45978668_45978718_-", + "length": 50, + "weight": 1.000000 + }, { + "name": "chr21_45993530_45993580_+", + "length": 50, + "weight": 1.000000 + }, { + "name": "chr21_46020421_46020471_+", + "length": 50, + "weight": 1.000000 + }, { + "name": "chr21_46031920_46031970_+", + "length": 50, + "weight": 1.000000 + }, { + "name": "chr21_46046964_46047014_+", + "length": 50, + "weight": 1.000000 + }, { + "name": "chr21_46057197_46057247_+", + "length": 50, + "weight": 1.000000 + }, { + "name": "chr21_46086869_46086919_-", + "length": 50, + "weight": 1.000000 + }, { + "name": "chr21_46102103_46102153_-", + "length": 50, + "weight": 1.000000 + }, { + "name": "chr21_47517957_47518007_+", + "length": 50, + "weight": 1.000000 + }, { + "name": "chr21_47575506_47575556_-", + "length": 50, + "weight": 1.000000 + } + ] + }, + "motifs": [ + { + "db": 0, + "id": "taCaaACAGtataactctcac", + "alt": "MEME-1", + "len": 21, + "nsites": 5, + "evalue": "4.6e-028", + "ic": 55.7, + "re": 68.0, + "llr": 236, + "bt": 7.73664, \ No newline at end of file diff -r 000000000000 -r 7653ebd919bb test-data/meme_output_custom.txt --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/meme_output_custom.txt Mon Jul 14 21:33:08 2025 +0000 @@ -0,0 +1,61 @@ +******************************************************************************** +MEME - Motif discovery tool +******************************************************************************** +MEME version 5.5.8 (Release date: Thu May 15 15:01:46 2025 -0700) + +For further information on how to interpret these results please access https://meme-suite.org/meme. +To get a copy of the MEME Suite software please access https://meme-suite.org. 
+ +******************************************************************************** + + +******************************************************************************** +REFERENCE +******************************************************************************** +If you use this program in your research, please cite: + +Timothy L. Bailey and Charles Elkan, +"Fitting a mixture model by expectation maximization to +discover motifs in biopolymers", +Proceedings of the Second International Conference on Intelligent Systems +for Molecular Biology, pp. 28-36, AAAI Press, Menlo Park, California, 1994. +******************************************************************************** + + +******************************************************************************** +ALPHABET "DNA with covalent modifications" DNA-LIKE +******************************************************************************** +A "Adenine" 8510A8 ~ T "Thymine" A89610 +C "Cytosine" A50026 ~ G "Guanine" 313695 +a "N6-methyladenine" 8510A8 ~ t "Thymine_lowercase" 756BB1 +c "5-Carboxylcytosine" FEE090 ~ 4 "Guanine:5-Carboxylcytosine" E0F3F8 +f "5-Formylcytosine" FDAE61 ~ 3 "Guanine:5-Formylcytosine" ABD9E9 +g "modified_g" 00897B ~ 5 "cytosine_lowercase" 53698A +h "5-Hydroxymethylcytosine" F46D43 ~ 2 "Guanine:5-Hydroxymethylcytosine" 74ADD1 +m "5-Methylcytosine" D73027 ~ 1 "Guanine:5-Methylcytosine" 4575B4 +? 
= ACGTacfghmt12345 +******************************************************************************** + +******************************************************************************** +TRAINING SET +******************************************************************************** +PRIMARY SEQUENCES= Galaxy_FASTA_Input +CONTROL SEQUENCES= --none-- +Sequence name Weight Length Sequence name Weight Length +------------- ------ ------ ------------- ------ ------ +chr21_19617074_19617124_ 1.0000 50 chr21_26934381_26934431_ 1.0000 50 +chr21_28217753_28217803_ 1.0000 50 chr21_31710037_31710087_ 1.0000 50 +chr21_31744582_31744632_ 1.0000 50 chr21_31768316_31768366_ 1.0000 50 +chr21_31914206_31914256_ 1.0000 50 chr21_31933633_31933683_ 1.0000 50 +chr21_31962741_31962791_ 1.0000 50 chr21_31964683_31964733_ 1.0000 50 +chr21_31973364_31973414_ 1.0000 50 chr21_31992870_31992920_ 1.0000 50 +chr21_32185595_32185645_ 1.0000 50 chr21_32202076_32202126_ 1.0000 50 +chr21_32253899_32253949_ 1.0000 50 chr21_32410820_32410870_ 1.0000 50 +chr21_36411748_36411798_ 1.0000 50 chr21_37838750_37838800_ 1.0000 50 +chr21_45705687_45705737_ 1.0000 50 chr21_45971413_45971463_ 1.0000 50 +chr21_45978668_45978718_ 1.0000 50 chr21_45993530_45993580_ 1.0000 50 +chr21_46020421_46020471_ 1.0000 50 chr21_46031920_46031970_ 1.0000 50 +chr21_46046964_46047014_ 1.0000 50 chr21_46057197_46057247_ 1.0000 50 +chr21_46086869_46086919_ 1.0000 50 chr21_46102103_46102153_ 1.0000 50 +chr21_47517957_47518007_ 1.0000 50 chr21_47575506_47575556_ 1.0000 50 +******************************************************************************** \ No newline at end of file diff -r 000000000000 -r 7653ebd919bb test-data/meme_output_custom.xml --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/meme_output_custom.xml Mon Jul 14 21:33:08 2025 +0000 @@ -0,0 +1,946 @@ + + +61 +-897 +-897 +-897 +-897 +-897 +-897 +-897 +-897 +-897 +443 +-897 +-897 +-897 +-897 +-897 + + +-897 +0 +-31 +-897 +375 +-897 +-897 +-897 +-897 +-897 
+285 +-897 +-897 +-897 +-897 +-897 + + +-897 +100 +-897 +-897 +375 +-897 +-897 +-897 +-897 +-897 +285 +-897 +-897 +-897 +-897 +-897 + + +-897 +0 +-897 +8 +433 +-897 +-897 +-897 +-897 +-897 +-897 +-897 +-897 +-897 +-897 +-897 + + +61 +-897 +-897 +-897 +433 +-897 +-897 +-897 +-897 +-897 +-897 +-897 +-897 +-897 +-897 +-897 + + +61 +-897 +-897 +-897 +375 +-897 +-897 +478 +-897 +-897 +-897 +-897 +-897 +-897 +-897 +-897 + + +-897 +100 +-897 +-897 +-897 +288 +-897 +478 +-897 +-897 +285 +-897 +-897 +-897 +-897 +-897 + + +61 +-897 +-897 +-897 +-897 +-897 +-897 +478 +-897 +-897 +385 +-897 +-897 +-897 +-897 +-897 + + +-897 +0 +-31 +-897 +275 +288 +-897 +478 +-897 +-897 +-897 +-897 +-897 +-897 +-897 +-897 + + +-39 +-897 +-31 +-897 +-897 +288 +-897 +-897 +-897 +-897 +385 +-897 +-897 +-897 +-897 +-897 + + +-897 +0 +-897 +-897 +375 +388 +-897 +-897 +-897 +-897 +-897 +-897 +-897 +-897 +-897 +-897 + + +-897 +-897 +-31 +-897 +-897 +-897 +-897 +-897 +-897 +-897 +485 +-897 +-897 +-897 +-897 +-897 + + +-897 +-897 +-31 +-897 +375 +388 +-897 +-897 +-897 +-897 +-897 +-897 +-897 +-897 +-897 +-897 + + +-897 +-897 +-897 +-897 +507 +-897 +-897 +-897 +-897 +-897 +-897 +-897 +-897 +-897 +-897 +-897 + + +-897 +-897 +-897 +-897 +275 +488 +-897 +-897 +-897 +-897 +-897 +-897 +-897 +-897 +-897 +-897 + + +-897 +-897 +-897 +-897 +275 +388 +-897 +-897 +-897 +-897 +385 +-897 +-897 +-897 +-897 +-897 + + +-897 +-897 +-897 +-897 +-897 +447 +-897 +-897 +-897 +-897 +385 +-897 +-897 +-897 +-897 +-897 + + +-897 +-897 +-897 +-897 +375 +-897 +-897 +-897 +-897 +-897 +443 +-897 +-897 +-897 +-897 +-897 + + +-897 +-897 +-897 +-897 +375 +447 +-897 +-897 +-897 +-897 +-897 +-897 +-897 +-897 +-897 +-897 + + +-897 +-897 +-897 +-897 +375 +-897 +-897 +478 +-897 +-897 +385 +-897 +-897 +-897 +-897 +-897 + + +-897 +-897 +-897 +-897 +275 +388 +-897 +478 +-897 +-897 +285 +-897 +-897 +-897 +-897 +-897 + + + + + + +0.400000 +0.000000 +0.000000 +0.000000 +0.000000 +0.000000 +0.000000 +0.000000 +0.000000 +0.000000 +0.600000 
+0.000000 +0.000000 +0.000000 +0.000000 +0.000000 + + +0.000000 +0.200000 +0.200000 +0.000000 +0.400000 +0.000000 +0.000000 +0.000000 +0.000000 +0.000000 +0.200000 +0.000000 +0.000000 +0.000000 +0.000000 +0.000000 + + +0.000000 +0.400000 +0.000000 +0.000000 +0.400000 +0.000000 +0.000000 +0.000000 +0.000000 +0.000000 +0.200000 +0.000000 +0.000000 +0.000000 +0.000000 +0.000000 + + +0.000000 +0.200000 +0.000000 +0.200000 +0.600000 +0.000000 +0.000000 +0.000000 +0.000000 +0.000000 +0.000000 +0.000000 +0.000000 +0.000000 +0.000000 +0.000000 + + +0.400000 +0.000000 +0.000000 +0.000000 +0.600000 +0.000000 +0.000000 +0.000000 +0.000000 +0.000000 +0.000000 +0.000000 +0.000000 +0.000000 +0.000000 +0.000000 + + +0.400000 +0.000000 +0.000000 +0.000000 +0.400000 +0.000000 +0.000000 +0.200000 +0.000000 +0.000000 +0.000000 +0.000000 +0.000000 +0.000000 +0.000000 +0.000000 + + +0.000000 +0.400000 +0.000000 +0.000000 +0.000000 +0.200000 +0.000000 +0.200000 +0.000000 +0.000000 +0.200000 +0.000000 +0.000000 +0.000000 +0.000000 +0.000000 + + +0.400000 +0.000000 +0.000000 +0.000000 +0.000000 +0.000000 +0.000000 +0.200000 +0.000000 +0.000000 +0.400000 +0.000000 +0.000000 +0.000000 +0.000000 +0.000000 + + +0.000000 +0.200000 +0.200000 +0.000000 +0.200000 +0.200000 +0.000000 +0.200000 +0.000000 +0.000000 +0.000000 +0.000000 +0.000000 +0.000000 +0.000000 +0.000000 + + +0.200000 +0.000000 +0.200000 +0.000000 +0.000000 +0.200000 +0.000000 +0.000000 +0.000000 +0.000000 +0.400000 +0.000000 +0.000000 +0.000000 +0.000000 +0.000000 + + +0.000000 +0.200000 +0.000000 +0.000000 +0.400000 +0.400000 +0.000000 +0.000000 +0.000000 +0.000000 +0.000000 +0.000000 +0.000000 +0.000000 +0.000000 +0.000000 + + +0.000000 +0.000000 +0.200000 +0.000000 +0.000000 +0.000000 +0.000000 +0.000000 +0.000000 +0.000000 +0.800000 +0.000000 +0.000000 +0.000000 +0.000000 +0.000000 + + +0.000000 +0.000000 +0.200000 +0.000000 +0.400000 +0.400000 +0.000000 +0.000000 +0.000000 +0.000000 +0.000000 +0.000000 +0.000000 +0.000000 
+0.000000 +0.000000 + + +0.000000 +0.000000 +0.000000 +0.000000 +1.000000 +0.000000 +0.000000 +0.000000 +0.000000 +0.000000 +0.000000 +0.000000 +0.000000 +0.000000 +0.000000 +0.000000 + + +0.000000 +0.000000 +0.000000 +0.000000 +0.200000 +0.800000 +0.000000 +0.000000 +0.000000 +0.000000 +0.000000 +0.000000 +0.000000 +0.000000 +0.000000 +0.000000 + + +0.000000 +0.000000 +0.000000 +0.000000 +0.200000 +0.400000 +0.000000 +0.000000 +0.000000 +0.000000 +0.400000 +0.000000 +0.000000 +0.000000 +0.000000 +0.000000 + + +0.000000 +0.000000 +0.000000 +0.000000 +0.000000 +0.600000 +0.000000 +0.000000 +0.000000 +0.000000 +0.400000 +0.000000 +0.000000 +0.000000 +0.000000 +0.000000 + + +0.000000 +0.000000 +0.000000 +0.000000 +0.400000 +0.000000 +0.000000 +0.000000 +0.000000 +0.000000 +0.600000 +0.000000 +0.000000 +0.000000 +0.000000 +0.000000 + + +0.000000 +0.000000 +0.000000 +0.000000 +0.400000 +0.600000 +0.000000 +0.000000 +0.000000 +0.000000 +0.000000 +0.000000 +0.000000 +0.000000 +0.000000 +0.000000 + + +0.000000 +0.000000 +0.000000 +0.000000 +0.400000 +0.000000 +0.000000 +0.200000 +0.000000 +0.000000 +0.400000 +0.000000 +0.000000 +0.000000 +0.000000 +0.000000 + + +0.000000 +0.000000 +0.000000 +0.000000 +0.200000 +0.400000 +0.000000 +0.200000 +0.000000 +0.000000 +0.200000 +0.000000 +0.000000 +0.000000 +0.000000 +0.000000 + + + + +[tA][aCGt][Cat][aCT][aA][Aag][Ccgt][Atg][CGacg][tAGc][acC][tG][acG]a[ca][cta][ct][ta][ca][atg][cagt] + + + +gatggttt + + + + + + + + + + + + + + + + + + + + + + + +ctcagccctc + + +AGTTGGCATC + + + + + + + + + + + + + + + + + + + + + + + +t + + +aaac + + + + + + + + + + + + + + + + + + + + + + + +actCTAGAAT + + +AAGCCCCAGC + + + + + + + + + + + + + + + + + + + + + + + +a + + +ATCCCTGAGC + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + diff -r 000000000000 -r 7653ebd919bb test-data/meme_output_test1.html --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ 
b/test-data/meme_output_test1.html Mon Jul 14 21:33:08 2025 +0000 @@ -0,0 +1,124 @@ + "sequences": [ + { + "name": "chr21_19617074_19617124_+", + "length": 50, + "weight": 1.000000 + }, { + "name": "chr21_26934381_26934431_+", + "length": 50, + "weight": 1.000000 + }, { + "name": "chr21_28217753_28217803_-", + "length": 50, + "weight": 1.000000 + }, { + "name": "chr21_31710037_31710087_-", + "length": 50, + "weight": 1.000000 + }, { + "name": "chr21_31744582_31744632_-", + "length": 50, + "weight": 1.000000 + }, { + "name": "chr21_31768316_31768366_+", + "length": 50, + "weight": 1.000000 + }, { + "name": "chr21_31914206_31914256_-", + "length": 50, + "weight": 1.000000 + }, { + "name": "chr21_31933633_31933683_-", + "length": 50, + "weight": 1.000000 + }, { + "name": "chr21_31962741_31962791_-", + "length": 50, + "weight": 1.000000 + }, { + "name": "chr21_31964683_31964733_+", + "length": 50, + "weight": 1.000000 + }, { + "name": "chr21_31973364_31973414_+", + "length": 50, + "weight": 1.000000 + }, { + "name": "chr21_31992870_31992920_+", + "length": 50, + "weight": 1.000000 + }, { + "name": "chr21_32185595_32185645_-", + "length": 50, + "weight": 1.000000 + }, { + "name": "chr21_32202076_32202126_-", + "length": 50, + "weight": 1.000000 + }, { + "name": "chr21_32253899_32253949_-", + "length": 50, + "weight": 1.000000 + }, { + "name": "chr21_32410820_32410870_-", + "length": 50, + "weight": 1.000000 + }, { + "name": "chr21_36411748_36411798_-", + "length": 50, + "weight": 1.000000 + }, { + "name": "chr21_37838750_37838800_-", + "length": 50, + "weight": 1.000000 + }, { + "name": "chr21_45705687_45705737_+", + "length": 50, + "weight": 1.000000 + }, { + "name": "chr21_45971413_45971463_-", + "length": 50, + "weight": 1.000000 + }, { + "name": "chr21_45978668_45978718_-", + "length": 50, + "weight": 1.000000 + }, { + "name": "chr21_45993530_45993580_+", + "length": 50, + "weight": 1.000000 + }, { + "name": "chr21_46020421_46020471_+", + "length": 50, + "weight": 
1.000000 + }, { + "name": "chr21_46031920_46031970_+", + "length": 50, + "weight": 1.000000 + }, { + "name": "chr21_46046964_46047014_+", + "length": 50, + "weight": 1.000000 + }, { + "name": "chr21_46057197_46057247_+", + "length": 50, + "weight": 1.000000 + }, { + "name": "chr21_46086869_46086919_-", + "length": 50, + "weight": 1.000000 + }, { + "name": "chr21_46102103_46102153_-", + "length": 50, + "weight": 1.000000 + }, { + "name": "chr21_47517957_47518007_+", + "length": 50, + "weight": 1.000000 + }, { + "name": "chr21_47575506_47575556_-", + "length": 50, + "weight": 1.000000 + } + ] + }, \ No newline at end of file diff -r 000000000000 -r 7653ebd919bb test-data/meme_output_test1.txt --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/meme_output_test1.txt Mon Jul 14 21:33:08 2025 +0000 @@ -0,0 +1,207 @@ +model: mod= zoops nmotifs= 1 evt= inf +objective function: em= E-value of product of p-values + starts= E-value of product of p-values +width: minw= 8 maxw= 50 +nsites: minsites= 2 maxsites= 30 wnsites= 0.8 +theta: spmap= pam spfuzz= 120 +em: prior= megap b= 7500 maxiter= 50 + distance= 1e-05 +trim: wg= 11 ws= 1 endgaps= yes +data: n= 1500 N= 30 +sample: seed= 0 hsfrac= 0 + searchsize= 1500 norand= no csites= 1000 +Dirichlet mixture priors file: prior30.plib +Letter frequencies in dataset: +A 0.294 C 0.231 D 0 E 0 F 0 G 0.257 H 0 I 0 K 0 +L 0 M 0 N 0 P 0 Q 0 R 0 S 0 T 0.217 V 0 +W 0 Y 0 +Background letter frequencies (from file dataset with add-one prior applied): +A 0.291 C 0.229 D 0.000658 E 0.000658 F 0.000658 G 0.255 H 0.000658 I 0.000658 K 0.000658 +L 0.000658 M 0.000658 N 0.000658 P 0.000658 Q 0.000658 R 0.000658 S 0.000658 T 0.215 V 0.000658 +W 0.000658 Y 0.000658 +Background model order: 0 +******************************************************************************** + + +******************************************************************************** +MOTIF GGGGTATAAAA MEME-1 width = 11 sites = 25 llr = 239 E-value = 2.4e-011 
+******************************************************************************** +-------------------------------------------------------------------------------- + Motif GGGGTATAAAA MEME-1 Description +-------------------------------------------------------------------------------- +Simplified A 2323:a:a8a8 +pos.-specific C ::3:::::::: +probability D ::::::::::: +matrix E ::::::::::: + F ::::::::::: + G 7746::::::1 + H ::::::::::: + I ::::::::::: + K ::::::::::: + L ::::::::::: + M ::::::::::: + N ::::::::::: + P ::::::::::: + Q ::::::::::: + R ::::::::::: + S ::::::::::: + T 1:2:a:a:2:: + V ::::::::::: + W ::::::::::: + Y ::::::::::: + + bits 10.6 + 9.5 + 8.5 + 7.4 +Relative 6.3 +Entropy 5.3 +(13.8 bits) 4.2 + 3.2 + 2.1 * ** + 1.1 ** ******** + 0.0 ----------- + +Multilevel GGGGTATAAAA +consensus AACA T +sequence + + +-------------------------------------------------------------------------------- + +-------------------------------------------------------------------------------- + Motif GGGGTATAAAA MEME-1 sites sorted by position p-value +-------------------------------------------------------------------------------- +Sequence name Start P-value Site +------------- ----- --------- ----------- +chr21_46046964_46047014_ 13 1.06e-06 AAGGCCAGGA GGGGTATAAAA GCCTGAGAGC +chr21_46057197_46057247_ 37 3.41e-06 ACAGGCCCTG GGCATATAAAA GCC +chr21_45971413_45971463_ 10 3.41e-06 CAGGCCCTG GGCATATAAAA GCCCCAGCAG +chr21_31964683_31964733_ 14 3.41e-06 GATTCACTGA GGCATATAAAA GGCCCTCTGC +chr21_45993530_45993580_ 8 4.00e-06 CCAAGGA GGAGTATAAAA GCCCCACAAA +chr21_32202076_32202126_ 14 5.01e-06 CCACCAGCTT GAGGTATAAAA AGCCCTGTAC +chr21_46031920_46031970_ 16 6.06e-06 ATACCCAGGG AGGGTATAAAA CCTCAGCAGC +chr21_32410820_32410870_ 22 8.67e-06 AATCACTGAG GATGTATAAAA GTCCCAGGGA +chr21_32185595_32185645_ 19 8.67e-06 CACCAGAGCT GGGATATATAA AGAAGGTTCT +chr21_31992870_31992920_ 17 8.67e-06 CACTATTGAA GATGTATAAAA TTTCATTTGC +chr21_46020421_46020471_ 3 1.21e-05 GA GACATATAAAA GCCAACATCC 
+chr21_47517957_47518007_ 33 1.59e-05 CCGGCGGGGC GGGGTATAAAG GGGGCGG +chr21_45978668_45978718_ 5 1.59e-05 CAGA GGGGTATAAAG GTTCCGACCA +chr21_31914206_31914256_ 16 1.68e-05 CCCACTACTT AGAGTATAAAA TCATTCTGAG +chr21_32253899_32253949_ 20 2.03e-05 CACCAGCAAG GATATATAAAA GCTCAGGAGT +chr21_31744582_31744632_ 13 3.06e-05 CAGGTCTAAG AGCATATATAA CTTGGAGTCC +chr21_19617074_19617124_ 40 3.06e-05 CCTCGGGACG TGGGTATATAA +chr21_45705687_45705737_ 38 3.82e-05 CGTGGTCGCG GGGGTATAACA GC +chr21_31768316_31768366_ 1 3.82e-05 . AACGTATATAA ATGGTCCTGT +chr21_47575506_47575556_ 31 4.02e-05 GCTGCCGGTG AGCGTATAAAG GCCCTGGCG +chr21_26934381_26934431_ 28 5.52e-05 AGTCACAAGT GAGTTATAAAA GGGTCGCACG +chr21_31710037_31710087_ 15 5.94e-05 CCCAGGTTTC TGAGTATATAA TCGCCGCACC +chr21_36411748_36411798_ 23 6.78e-05 AGTTTCAGTT GGCATCtaaaa attatataac +chr21_31933633_31933683_ 3 2.08e-04 TC AGAGTATATAT AAATGTTCCT +chr21_31962741_31962791_ 14 4.05e-04 TATAACTCAG GTTGGATAAAA TAATTTGTAC +-------------------------------------------------------------------------------- + +-------------------------------------------------------------------------------- + Motif GGGGTATAAAA MEME-1 block diagrams +-------------------------------------------------------------------------------- +SEQUENCE NAME POSITION P-VALUE MOTIF DIAGRAM +------------- ---------------- ------------- +chr21_46046964_46047014_ 1.1e-06 12_[1]_27 +chr21_46057197_46057247_ 3.4e-06 36_[1]_3 +chr21_45971413_45971463_ 3.4e-06 9_[1]_30 +chr21_31964683_31964733_ 3.4e-06 13_[1]_26 +chr21_45993530_45993580_ 4e-06 7_[1]_32 +chr21_32202076_32202126_ 5e-06 13_[1]_26 +chr21_46031920_46031970_ 6.1e-06 15_[1]_24 +chr21_32410820_32410870_ 8.7e-06 21_[1]_18 +chr21_32185595_32185645_ 8.7e-06 18_[1]_21 +chr21_31992870_31992920_ 8.7e-06 16_[1]_23 +chr21_46020421_46020471_ 1.2e-05 2_[1]_37 +chr21_47517957_47518007_ 1.6e-05 32_[1]_7 +chr21_45978668_45978718_ 1.6e-05 4_[1]_35 +chr21_31914206_31914256_ 1.7e-05 15_[1]_24 +chr21_32253899_32253949_ 2e-05 19_[1]_20 
+chr21_31744582_31744632_ 3.1e-05 12_[1]_27 +chr21_19617074_19617124_ 3.1e-05 39_[1] +chr21_45705687_45705737_ 3.8e-05 37_[1]_2 +chr21_31768316_31768366_ 3.8e-05 [1]_39 +chr21_47575506_47575556_ 4e-05 30_[1]_9 +chr21_26934381_26934431_ 5.5e-05 27_[1]_12 +chr21_31710037_31710087_ 5.9e-05 14_[1]_25 +chr21_36411748_36411798_ 6.8e-05 22_[1]_17 +chr21_31933633_31933683_ 0.00021 2_[1]_37 +chr21_31962741_31962791_ 0.0004 13_[1]_26 +-------------------------------------------------------------------------------- + +-------------------------------------------------------------------------------- + Motif GGGGTATAAAA MEME-1 in BLOCKS format +-------------------------------------------------------------------------------- +BL MOTIF GGGGTATAAAA width=11 seqs=25 +chr21_46046964_46047014_ ( 13) GGGGTATAAAA 1 +chr21_46057197_46057247_ ( 37) GGCATATAAAA 1 +chr21_45971413_45971463_ ( 10) GGCATATAAAA 1 +chr21_31964683_31964733_ ( 14) GGCATATAAAA 1 +chr21_45993530_45993580_ ( 8) GGAGTATAAAA 1 +chr21_32202076_32202126_ ( 14) GAGGTATAAAA 1 +chr21_46031920_46031970_ ( 16) AGGGTATAAAA 1 +chr21_32410820_32410870_ ( 22) GATGTATAAAA 1 +chr21_32185595_32185645_ ( 19) GGGATATATAA 1 +chr21_31992870_31992920_ ( 17) GATGTATAAAA 1 +chr21_46020421_46020471_ ( 3) GACATATAAAA 1 +chr21_47517957_47518007_ ( 33) GGGGTATAAAG 1 +chr21_45978668_45978718_ ( 5) GGGGTATAAAG 1 +chr21_31914206_31914256_ ( 16) AGAGTATAAAA 1 +chr21_32253899_32253949_ ( 20) GATATATAAAA 1 +chr21_31744582_31744632_ ( 13) AGCATATATAA 1 +chr21_19617074_19617124_ ( 40) TGGGTATATAA 1 +chr21_45705687_45705737_ ( 38) GGGGTATAACA 1 +chr21_31768316_31768366_ ( 1) AACGTATATAA 1 +chr21_47575506_47575556_ ( 31) AGCGTATAAAG 1 +chr21_26934381_26934431_ ( 28) GAGTTATAAAA 1 +chr21_31710037_31710087_ ( 15) TGAGTATATAA 1 +chr21_36411748_36411798_ ( 23) GGCATCTAAAA 1 +chr21_31933633_31933683_ ( 3) AGAGTATATAT 1 +chr21_31962741_31962791_ ( 14) GTTGGATAAAA 1 +// + +-------------------------------------------------------------------------------- + 
+-------------------------------------------------------------------------------- + Motif GGGGTATAAAA MEME-1 position-specific scoring matrix +-------------------------------------------------------------------------------- +log-odds matrix: alength= 20 w= 11 n= 1200 bayes= 5.33554 E= 2.4e-011 + -32 -680 91 77 7 138 -20 55 64 107 11 150 142 72 87 396 -148 221 -140 -36 + -11 -680 89 76 7 137 -21 55 63 107 10 149 141 71 87 396 -239 220 -140 -36 + -79 41 4 21 -7 44 -62 42 -5 99 0 99 138 52 42 399 -46 223 -173 -68 + 11 -677 48 47 -2 127 -43 46 27 101 3 124 138 60 62 397 -235 220 -160 -55 + -596 -820 12 -21 -53 -267 -74 37 16 44 -37 98 31 9 19 319 212 127 -193 -95 + 165 -261 70 110 77 -521 -4 147 95 201 90 121 124 91 107 425 -527 314 -95 8 + -838 -990 -89 -149 -151 -841 -161 -117 -113 -66 -209 -68 -69 -129 -91 111 221 -55 -255 -173 + 176 -858 -79 -103 -115 -717 -148 -95 -108 -17 -162 -61 -12 -95 -69 193 -737 52 -240 -153 + 134 -686 0 16 -12 -553 -68 44 -8 96 -9 88 124 41 36 384 11 216 -177 -71 + 165 -261 70 110 77 -521 -4 147 95 201 90 121 124 91 107 425 -527 314 -95 8 + 147 -614 89 129 93 -121 12 160 113 217 108 144 144 111 125 447 -241 332 -81 22 +-------------------------------------------------------------------------------- + +-------------------------------------------------------------------------------- + Motif GGGGTATAAAA MEME-1 position-specific probability matrix +-------------------------------------------------------------------------------- +letter-probability matrix: alength= 20 w= 11 nsites= 25 E= 2.4e-011 + 0.240000 0.000000 0.000000 0.000000 0.000000 0.680000 0.000000 0.000000 0.000000 0.000000 0.000000 0.000000 0.000000 0.000000 0.000000 0.000000 0.080000 0.000000 0.000000 0.000000 + 0.280000 0.000000 0.000000 0.000000 0.000000 0.680000 0.000000 0.000000 0.000000 0.000000 0.000000 0.000000 0.000000 0.000000 0.000000 0.000000 0.040000 0.000000 0.000000 0.000000 + 0.160000 0.320000 0.000000 0.000000 0.000000 0.360000 0.000000 0.000000 0.000000 0.000000 
0.000000 0.000000 0.000000 0.000000 0.000000 0.000000 0.160000 0.000000 0.000000 0.000000 + 0.320000 0.000000 0.000000 0.000000 0.000000 0.640000 0.000000 0.000000 0.000000 0.000000 0.000000 0.000000 0.000000 0.000000 0.000000 0.000000 0.040000 0.000000 0.000000 0.000000 + 0.000000 0.000000 0.000000 0.000000 0.000000 0.040000 0.000000 0.000000 0.000000 0.000000 0.000000 0.000000 0.000000 0.000000 0.000000 0.000000 0.960000 0.000000 0.000000 0.000000 + 0.960000 0.040000 0.000000 0.000000 0.000000 0.000000 0.000000 0.000000 0.000000 0.000000 0.000000 0.000000 0.000000 0.000000 0.000000 0.000000 0.000000 0.000000 0.000000 0.000000 + 0.000000 0.000000 0.000000 0.000000 0.000000 0.000000 0.000000 0.000000 0.000000 0.000000 0.000000 0.000000 0.000000 0.000000 0.000000 0.000000 1.000000 0.000000 0.000000 0.000000 + 1.000000 0.000000 0.000000 0.000000 0.000000 0.000000 0.000000 0.000000 0.000000 0.000000 0.000000 0.000000 0.000000 0.000000 0.000000 0.000000 0.000000 0.000000 0.000000 0.000000 + 0.760000 0.000000 0.000000 0.000000 0.000000 0.000000 0.000000 0.000000 0.000000 0.000000 0.000000 0.000000 0.000000 0.000000 0.000000 0.000000 0.240000 0.000000 0.000000 0.000000 + 0.960000 0.040000 0.000000 0.000000 0.000000 0.000000 0.000000 0.000000 0.000000 0.000000 0.000000 0.000000 0.000000 0.000000 0.000000 0.000000 0.000000 0.000000 0.000000 0.000000 + 0.840000 0.000000 0.000000 0.000000 0.000000 0.120000 0.000000 0.000000 0.000000 0.000000 0.000000 0.000000 0.000000 0.000000 0.000000 0.000000 0.040000 0.000000 0.000000 0.000000 +-------------------------------------------------------------------------------- + +-------------------------------------------------------------------------------- + Motif GGGGTATAAAA MEME-1 regular expression +-------------------------------------------------------------------------------- +[GA][GA][GC][GA]TATA[AT]AA +-------------------------------------------------------------------------------- \ No newline at end of file diff -r 000000000000 
-r 7653ebd919bb test-data/meme_output_test1.xml --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/meme_output_test1.xml Mon Jul 14 21:33:08 2025 +0000 @@ -0,0 +1,979 @@ + +-32 +-680 +91 +77 +7 +138 +-20 +55 +64 +107 +11 +150 +142 +72 +87 +396 +-148 +221 +-140 +-36 + + +-11 +-680 +89 +76 +7 +137 +-21 +55 +63 +107 +10 +149 +141 +71 +87 +396 +-239 +220 +-140 +-36 + + +-79 +41 +4 +21 +-7 +44 +-62 +42 +-5 +99 +0 +99 +138 +52 +42 +399 +-46 +223 +-173 +-68 + + +11 +-677 +48 +47 +-2 +127 +-43 +46 +27 +101 +3 +124 +138 +60 +62 +397 +-235 +220 +-160 +-55 + + +-596 +-820 +12 +-21 +-53 +-267 +-74 +37 +16 +44 +-37 +98 +31 +9 +19 +319 +212 +127 +-193 +-95 + + +165 +-261 +70 +110 +77 +-521 +-4 +147 +95 +201 +90 +121 +124 +91 +107 +425 +-527 +314 +-95 +8 + + +-838 +-990 +-89 +-149 +-151 +-841 +-161 +-117 +-113 +-66 +-209 +-68 +-69 +-129 +-91 +111 +221 +-55 +-255 +-173 + + +176 +-858 +-79 +-103 +-115 +-717 +-148 +-95 +-108 +-17 +-162 +-61 +-12 +-95 +-69 +193 +-737 +52 +-240 +-153 + + +134 +-686 +0 +16 +-12 +-553 +-68 +44 +-8 +96 +-9 +88 +124 +41 +36 +384 +11 +216 +-177 +-71 + + +165 +-261 +70 +110 +77 +-521 +-4 +147 +95 +201 +90 +121 +124 +91 +107 +425 +-527 +314 +-95 +8 + + +147 +-614 +89 +129 +93 +-121 +12 +160 +113 +217 +108 +144 +144 +111 +125 +447 +-241 +332 +-81 +22 + + + + + + +0.240000 +0.000000 +0.000000 +0.000000 +0.000000 +0.680000 +0.000000 +0.000000 +0.000000 +0.000000 +0.000000 +0.000000 +0.000000 +0.000000 +0.000000 +0.000000 +0.080000 +0.000000 +0.000000 +0.000000 + + +0.280000 +0.000000 +0.000000 +0.000000 +0.000000 +0.680000 +0.000000 +0.000000 +0.000000 +0.000000 +0.000000 +0.000000 +0.000000 +0.000000 +0.000000 +0.000000 +0.040000 +0.000000 +0.000000 +0.000000 + + +0.160000 +0.320000 +0.000000 +0.000000 +0.000000 +0.360000 +0.000000 +0.000000 +0.000000 +0.000000 +0.000000 +0.000000 +0.000000 +0.000000 +0.000000 +0.000000 +0.160000 +0.000000 +0.000000 +0.000000 + + +0.320000 +0.000000 +0.000000 +0.000000 +0.000000 +0.640000 +0.000000 +0.000000 
+0.000000 +0.000000 +0.000000 +0.000000 +0.000000 +0.000000 +0.000000 +0.000000 +0.040000 +0.000000 +0.000000 +0.000000 + + +0.000000 +0.000000 +0.000000 +0.000000 +0.000000 +0.040000 +0.000000 +0.000000 +0.000000 +0.000000 +0.000000 +0.000000 +0.000000 +0.000000 +0.000000 +0.000000 +0.960000 +0.000000 +0.000000 +0.000000 + + +0.960000 +0.040000 +0.000000 +0.000000 +0.000000 +0.000000 +0.000000 +0.000000 +0.000000 +0.000000 +0.000000 +0.000000 +0.000000 +0.000000 +0.000000 +0.000000 +0.000000 +0.000000 +0.000000 +0.000000 + + +0.000000 +0.000000 +0.000000 +0.000000 +0.000000 +0.000000 +0.000000 +0.000000 +0.000000 +0.000000 +0.000000 +0.000000 +0.000000 +0.000000 +0.000000 +0.000000 +1.000000 +0.000000 +0.000000 +0.000000 + + +1.000000 +0.000000 +0.000000 +0.000000 +0.000000 +0.000000 +0.000000 +0.000000 +0.000000 +0.000000 +0.000000 +0.000000 +0.000000 +0.000000 +0.000000 +0.000000 +0.000000 +0.000000 +0.000000 +0.000000 + + +0.760000 +0.000000 +0.000000 +0.000000 +0.000000 +0.000000 +0.000000 +0.000000 +0.000000 +0.000000 +0.000000 +0.000000 +0.000000 +0.000000 +0.000000 +0.000000 +0.240000 +0.000000 +0.000000 +0.000000 + + +0.960000 +0.040000 +0.000000 +0.000000 +0.000000 +0.000000 +0.000000 +0.000000 +0.000000 +0.000000 +0.000000 +0.000000 +0.000000 +0.000000 +0.000000 +0.000000 +0.000000 +0.000000 +0.000000 +0.000000 + + +0.840000 +0.000000 +0.000000 +0.000000 +0.000000 +0.120000 +0.000000 +0.000000 +0.000000 +0.000000 +0.000000 +0.000000 +0.000000 +0.000000 +0.000000 +0.000000 +0.040000 +0.000000 +0.000000 +0.000000 + + + + +[GA][GA][GC][GA]TATA[AT]AA + + + +AAGGCCAGGA + + + + + + + + + + + + + +GCCTGAGAGC + + +ACAGGCCCTG + + + + + + + + + + + + + +GCC + + +CAGGCCCTG + + + + + + + + + + + + + +GCCCCAGCAG + + +GATTCACTGA + + + + + + + + + + + + + +GGCCCTCTGC + + +CCAAGGA + + + + + + + + + + + + + +GCCCCACAAA + + +CCACCAGCTT + + + + + + + + + + + + + +AGCCCTGTAC + + +ATACCCAGGG + + + + + + + + + + + + + +CCTCAGCAGC + + +AATCACTGAG + + + + + + + + + + + + + 
+GTCCCAGGGA + + +CACCAGAGCT + + + + + + + + + + + + + +AGAAGGTTCT + + +CACTATTGAA + + + + + + + + + + + + + +TTTCATTTGC + + +GA + + + + + + + + + + + + + +GCCAACATCC + + +CCGGCGGGGC + + + + + + + + + + + + + +GGGGCGG + + +CAGA + + + + + + + + + + + + + +GTTCCGACCA + + +CCCACTACTT + + + + + + + + + + + + + +TCATTCTGAG + + +CACCAGCAAG + + + + + + + + + + + + + +GCTCAGGAGT + + +CAGGTCTAAG + + + + + + + + + + + + + +CTTGGAGTCC + + +CCTCGGGACG + + + + + + + + + + + + + + + + +CGTGGTCGCG + + + + + + + + + + + + + +GC + + + + + + + + + + + + + + + + +ATGGTCCTGT + + +GCTGCCGGTG + + + + + + + + + + + + + +GCCCTGGCG + + +AGTCACAAGT + + + + + + + + + + + + + +GGGTCGCACG + + +CCCAGGTTTC + + + + + + + + + + + + + +TCGCCGCACC + + +AGTTTCAGTT + + + + + + + + + + + + + +attatataac + + +TC + + + + + + + + + + + + + +AAATGTTCCT + + +TATAACTCAG + + + + + + + + + + + + + +TAATTTGTAC + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + diff -r 000000000000 -r 7653ebd919bb test-data/meme_output_test2.html --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/meme_output_test2.html Mon Jul 14 21:33:08 2025 +0000 @@ -0,0 +1,9578 @@ + * See http://stackoverflow.com/a/5450113/66387 + * Does string multiplication like the perl x operator. 
+ */ +function string_mult(pattern, count) { + if (count < 1) return ''; + var result = ''; + while (count > 1) { + if (count & 1) result += pattern; + count >>= 1, pattern += pattern; + } + return result + pattern; +} + +/* + * See http://stackoverflow.com/questions/814613/how-to-read-get-data-from-a-url-using-javascript + * Slightly modified with information from + * https://developer.mozilla.org/en/DOM/window.location + */ +function parse_params() { + "use strict"; + var search, queryStart, queryEnd, query, params, nvPairs, i, nv, n, v; + search = window.location.search; + queryStart = search.indexOf("?") + 1; + queryEnd = search.indexOf("#") + 1 || search.length + 1; + query = search.slice(queryStart, queryEnd - 1); + + if (query === search || query === "") return {}; + + params = {}; + nvPairs = query.replace(/\+/g, " ").split("&"); + + for (i = 0; i < nvPairs.length; i++) { + nv = nvPairs[i].split("="); + n = decodeURIComponent(nv[0]); + v = decodeURIComponent(nv[1]); + // allow a name to be used multiple times + // storing each value in the array + if (!(n in params)) { + params[n] = []; + } + params[n].push(nv.length === 2 ? v : null); + } + return params; +} + +/* + * coords + * + * Calculates the x and y offset of an element. + * From http://www.quirksmode.org/js/findpos.html + * with alterations to take into account scrolling regions + */ +function coords(elem) { + var myX = myY = 0; + if (elem.getBoundingClientRect) { + var rect; + rect = elem.getBoundingClientRect(); + myX = rect.left + ((typeof window.pageXOffset !== "undefined") ? + window.pageXOffset : document.body.scrollLeft); + myY = rect.top + ((typeof window.pageYOffset !== "undefined") ? + window.pageYOffset : document.body.scrollTop); + } else { + // this fall back doesn't properly handle absolutely positioned elements + // inside a scrollable box + var node; + if (elem.offsetParent) { + // subtract all scrolling + node = elem; + do { + myX -= node.scrollLeft ? 
node.scrollLeft : 0; + myY -= node.scrollTop ? node.scrollTop : 0; + } while (node = node.parentNode); + // this will include the page scrolling (which is unwanted) so add it back on + myX += (typeof window.pageXOffset !== "undefined") ? window.pageXOffset : document.body.scrollLeft; + myY += (typeof window.pageYOffset !== "undefined") ? window.pageYOffset : document.body.scrollTop; + // sum up offsets + node = elem; + do { + myX += node.offsetLeft; + myY += node.offsetTop; + } while (node = node.offsetParent); + } + } + return [myX, myY]; +} + +/* + * position_popup + * + * Positions a popup relative to an anchor element. + * + * The available positions are: + * 0 - Centered below the anchor. + */ +function position_popup(anchor, popup, position) { + "use strict"; + var a_x, a_y, a_w, a_h, p_x, p_y, p_w, p_h; + var a_xy, spacer, margin, scrollbar, page_w; + // define constants + spacer = 5; + margin = 15; + scrollbar = 15; + // define the positions and widths + a_xy = coords(anchor); + a_x = a_xy[0]; + a_y = a_xy[1]; + a_w = anchor.offsetWidth; + a_h = anchor.offsetHeight; + p_w = popup.offsetWidth; + p_h = popup.offsetHeight; + page_w = null; + if (window.innerWidth) { + page_w = window.innerWidth; + } else if (document.body) { + page_w = document.body.clientWidth; + } + // check the position type is defined + if (typeof position !== "number") { + position = 0; + } + // calculate the popup position + switch (position) { + case 1: + p_x = a_x + a_w + spacer; + p_y = a_y + (a_h / 2) - (p_h / 2); + break; + case 0: + default: + p_x = a_x + (a_w / 2) - (p_w / 2); + p_y = a_y + a_h + spacer; + break; + } + // constrain the popup position + if (p_x < margin) { + p_x = margin; + } else if (page_w != null && (p_x + p_w) > (page_w - margin - scrollbar)) { + p_x = page_w - margin - scrollbar - p_w; + } + if (p_y < margin) { + p_y = margin; + } + // position the popup + popup.style.left = p_x + "px"; + popup.style.top = p_y + "px"; +} + +function lookup_help_popup(popup_id) 
{ + var _body, pop, info; + pop = document.getElementById(popup_id); + if (pop == null) { + _body = document.getElementsByTagName("body")[0]; + pop = document.createElement("div"); + pop.className = "pop_content"; + pop.id = popup_id; + pop.style.backgroundColor = "#FFC"; + pop.style.borderColor = "black"; + info = document.createElement("p"); + info.style.fontWeight = "bold"; + info.appendChild(document.createTextNode("Error: No popup for topic \"" + popup_id + "\".")); + pop.appendChild(info); + // this might cause problems with the menu, but as this only happens + // when something is already wrong I don't think that's too much of a problem + _body.insertBefore(pop, _body.firstChild); + } + if (document.getElementsByTagName('body')[0].hasAttribute("data-autobtns")) { + if (!/\bauto_buttons\b/.test(pop.className)) { + pop.className += " auto_buttons"; + var back_btn_sec = document.createElement("div"); + back_btn_sec.className = "nested_only pop_back_sec"; + var back_btn = document.createElement("span"); + back_btn.className = "pop_back"; + back_btn.appendChild(document.createTextNode("<< back")); + back_btn.addEventListener("click", function(e) { + help_return(); + }, false); + back_btn_sec.appendChild(back_btn); + pop.insertBefore(back_btn_sec, pop.firstChild); + var close_btn_sec = document.createElement("div"); + close_btn_sec.className = "pop_close_sec"; + var close_btn = document.createElement("span"); + close_btn.className = "pop_close"; + close_btn.appendChild(document.createTextNode("close")); + close_btn.addEventListener("click", function(e) { + help_popup(); + }, false); + close_btn_sec.appendChild(close_btn); + pop.appendChild(close_btn_sec); + } + } + return pop; +} + +/* + * help_popup + * + * Moves around help pop-ups so they appear + * below an activator. 
+ */ +function help_popup(activator, popup_id) { /* State is kept on the function object: help_popup.popup is the stack of shown popups and help_popup.activator the element that opened them. Called with no activator it hides the current popup; called again with the same activator and popup it toggles the popup off. */ + "use strict"; + var pop; + // set default values + if (typeof help_popup.popup === "undefined") { + help_popup.popup = []; + } + if (typeof help_popup.activator === "undefined") { + help_popup.activator = null; + } + var last_pop = (help_popup.popup.length > 0 ? help_popup.popup[help_popup.popup.length - 1] : null); + if (typeof(activator) == "undefined") { // no activator so hide + if (last_pop != null) { + last_pop.style.display = 'none'; + help_popup.popup = []; + } + return; + } + pop = lookup_help_popup(popup_id); + if (pop == last_pop) { + if (activator == help_popup.activator) { + //hide popup (as we've already shown it for the current help button) + last_pop.style.display = 'none'; + help_popup.popup = []; + return; // toggling complete! + } + } else if (last_pop != null) { + //activating different popup so hide current one + last_pop.style.display = 'none'; + } + help_popup.popup = [pop]; /* the stack is reset to just this popup */ + help_popup.activator = activator; + toggle_class(pop, "nested", false); + //must make the popup visible to measure it or it has zero width + pop.style.display = 'block'; + position_popup(activator, pop); +} + +/* + * help_refine + * + * Intended for links within a help popup. Stores a stack of state so + * you can go back.
+ */ +function help_refine(popup_id) { + if (help_popup.popup == null || help_popup.popup.length == 0 || help_popup.activator == null) { /* nothing is shown yet: open the popup first, using the element whose id is popup_id followed by _act as the activator */ + //throw new Error("Cannot refine a help popup when one is not shown!"); + var pop = lookup_help_popup(popup_id); + var act_id = popup_id + '_act'; + var activator = document.getElementById(act_id); + help_popup(activator, popup_id); + } + var pop = lookup_help_popup(popup_id); + var last_pop = help_popup.popup[help_popup.popup.length - 1]; + if (pop == last_pop) return; // slightly odd, but no real cause for alarm + help_popup.popup.push(pop); + toggle_class(pop, "nested", true); + last_pop.style.display = "none"; + //must make the popup visible to measure it or it has zero width + pop.style.display = "block"; + position_popup(help_popup.activator, pop); +} + +/* + * help_return + * + * Intended for the back link within a help popup. Pops the current popup off + * the help_popup.popup stack and shows the previous one again, if any. + */ +function help_return() { + if (help_popup.popup == null || help_popup.popup.length == 0 || help_popup.activator == null) { + throw new Error("Can not return to a earlier help popup when one is not shown!"); + } + var last_pop = help_popup.popup.pop(); + last_pop.style.display = "none"; + var pop = (help_popup.popup.length > 0 ? help_popup.popup[help_popup.popup.length - 1] : null); + if (pop != null) { + toggle_class(pop, "nested", help_popup.popup.length > 1); + pop.style.display = "block"; + position_popup(help_popup.activator, pop); + } else { + help_popup.activator = null; + } +} + +/* + * update_scroll_pad + * + * Creates padding at the bottom of the page to allow + * scrolling of anything into view. + */ +function update_scroll_pad() { + var page, pad; + page = (document.compatMode === "CSS1Compat") ?
document.documentElement : document.body; + pad = $("scrollpad"); /* NOTE(review): $ is not defined in this part of the file; presumably an id lookup helper - confirm */ + if (pad === null) { + pad = document.createElement("div"); + pad.id = 'scrollpad'; + document.getElementsByTagName('body')[0].appendChild(pad); + } + pad.style.height = Math.abs(page.clientHeight - 100) + "px"; +} + +function substitute_classes(node, remove, add) { /* Rewrites node.className: drops every class name listed in remove, then adds every class name listed in add. */ + "use strict"; + var list, all, i, cls, classes; + list = node.className.split(/\s+/); + all = {}; + for (i = 0; i < list.length; i++) { + if (list[i].length > 0) all[list[i]] = true; + } + for (i = 0; i < remove.length; i++) { + if (all.hasOwnProperty(remove[i])) { + delete all[remove[i]]; + } + } + for (i = 0; i < add.length; i++) { + all[add[i]] = true; + } + classes = ""; + for (cls in all) { + classes += cls + " "; + } + node.className = classes; +} + +/* + * toggle_class + * + * Adds or removes a class from the node. If the parameter 'enabled' is not + * passed then the existence of the class will be toggled, otherwise it will be + * included if enabled is true. + */ +function toggle_class(node, cls, enabled) { + var classes = node.className; + var list = classes.replace(/^\s+/, '').replace(/\s+$/, '').split(/\s+/); + var found = false; + for (var i = 0; i < list.length; i++) { /* every existing occurrence of cls is removed first; it is re-added below when required */ + if (list[i] == cls) { + list.splice(i, 1); + i--; + found = true; + } + } + if (typeof enabled == "undefined") { + if (!found) list.push(cls); + } else { + if (enabled) list.push(cls); + } + node.className = list.join(" "); +} + +/* + * find_child + * + * Searches child nodes in depth first order and returns the first it finds + * with the className specified.
+ * TODO replace with querySelector + */ +function find_child(node, className) { /* className may be a string, matched as a whole word, or an already built RegExp, which is how the recursive calls pass it down. The node itself is tested before its children. Returns null when nothing matches. */ + var pattern; + if (node == null || typeof node !== "object") { + return null; + } + if (typeof className === "string") { + pattern = new RegExp("\\b" + className + "\\b"); + } else { + pattern = className; + } + if (node.nodeType == Node.ELEMENT_NODE && + pattern.test(node.className)) { + return node; + } else { + var result = null; + for (var i = 0; i < node.childNodes.length; i++) { + result = find_child(node.childNodes[i], pattern); + if (result != null) break; + } + return result; + } +} + +/* + * find_parent + * + * Searches parent nodes outwards from the node and returns the first it finds + * with the className specified. The node itself is tested first; returns null when none matches. + */ +function find_parent(node, className) { + var pattern; + pattern = new RegExp("\\b" + className + "\\b"); + do { + if (node.nodeType == Node.ELEMENT_NODE && + pattern.test(node.className)) { + return node; + } + } while (node = node.parentNode); + return null; +} + +/* + * find_parent_tag + * + * Searches parent nodes outwards from the node and returns the first it finds + * with the tag name specified. HTML tags should be specified in upper case. The node itself is tested first; returns null when none matches. + */ +function find_parent_tag(node, tag_name) { + do { + if (node.nodeType == Node.ELEMENT_NODE && node.tagName == tag_name) { + return node; + } + } while (node = node.parentNode); + return null; +} + +/* + * __toggle_help + * + * Uses the data-topic attribute of the this object to + * toggle display of a help topic. + * + * This function is not intended to be called directly.
+ */ +function __toggle_help(e) { /* Event handler: this must be the help button. Keydown events are acted on only for key codes 13 and 32. */ + if (!e) e = window.event; + if (e.type === "keydown") { + if (e.keyCode !== 13 && e.keyCode !== 32) { + return; + } + // stop a submit or something like that + e.preventDefault(); + } + + help_popup(this, this.getAttribute("data-topic")); +} + +function setup_help_button(button) { /* Wires click and keydown handlers that open the popup named by the data-topic attribute; hides the button when no element with that id exists. The class active is always appended. */ + "use strict"; + var topic; + if (button.hasAttribute("data-topic")) { + topic = button.getAttribute("data-topic"); + if (document.getElementById(topic) != null) { + button.tabIndex = "0"; // make keyboard selectable + button.addEventListener("click", function() { + help_popup(button, topic); + }, false); + button.addEventListener("keydown", function(e) { + // toggle only on Enter or Spacebar, let other keys do their thing + if (e.keyCode !== 13 && e.keyCode !== 32) return; + // stop a submit or something like that + e.preventDefault(); + help_popup(button, topic); + }, false); + } else { + button.style.visibility = "hidden"; + } + } + button.className += " active"; +} + +/* + * help_button + * + * Makes a help button for the passed topic. + */ +function help_button(topic) { + var btn = document.createElement("div"); + btn.className = "help"; + btn.setAttribute("data-topic", topic); + setup_help_button(btn); + return btn; +} + +/* + * prepare_download + * + * Sets the attributes of a link to setup a file download using the given content. + * If no link is provided then create one and click it. + */ +function prepare_download(content, mimetype, filename, link) { + "use strict"; + // if no link is provided then create one and click it + var click_link = false; + if (!link) { + link = document.createElement("a"); + click_link = true; + } + try { + // Use a BLOB to convert the text into a data URL. + // We could do this manually with a base 64 conversion. + // This will only be supported on modern browsers, + // hence the try block.
+ var blob = new Blob([content], {type: mimetype}); + var reader = new FileReader(); + reader.onloadend = function() { + // If we're lucky the browser will also support the download + // attribute which will let us suggest a file name to save the link. + // Otherwise it is likely that the filename will be unintelligible. + link.setAttribute("download", filename); + link.href = reader.result; + if (click_link) { + // must add the link to click it + document.body.appendChild(link); + link.click(); + document.body.removeChild(link); + } + } + reader.readAsDataURL(blob); + } catch (error) { + if (console && console.log) console.log(error); + // probably an old browser + link.href = ""; + link.visible = false; /* NOTE(review): visible is not a standard anchor property, so this probably has no effect - confirm intent */ + } +} + +/* + * add_cell + * + * Add a cell to the table row. + */ +function add_cell(row, node, cls, click_action) { /* node, cls and click_action are each optional and skipped when falsy */ + var cell = row.insertCell(row.cells.length); + if (node) cell.appendChild(node); + if (cls && cls !== "") cell.className = cls; + if (click_action) cell.addEventListener("click", click_action, false); +} + +/* + * add_header_cell + * + * Add a header cell to the table row. + */ +function add_header_cell(row, node, help_topic, cls, colspan, is_new) { + var th = document.createElement("th"); + if (node) th.appendChild(node); + if (help_topic && help_topic !== "") th.appendChild(help_button(help_topic)); + if (is_new && is_new !== "") { + var br = document.createElement("span"); + br.innerHTML = "
"; + th.appendChild(br); /* NOTE(review): the markup assigned to innerHTML above appears to have been lost from this copy - confirm against the generated file */ + var new_icon = document.createElement("img"); + new_icon.src = new_icon_src; /* NOTE(review): new_icon_src is not defined in this part of the file; presumably a global set elsewhere - confirm */ + new_icon.alt = "NEW"; + th.appendChild(new_icon); + } + if (cls && cls !== "") th.className = cls; + if (typeof colspan == "number" && colspan > 1) th.colSpan = colspan; + row.appendChild(th); +} + +/* + * add_text_cell + * + * Add a text cell to the table row. + */ +function add_text_cell(row, text, cls, action) { + var node = null; + if (typeof(text) != 'undefined') node = document.createTextNode(text); + add_cell(row, node, cls, action); +} + +/* + * add_text_header_cell + * + * Add a text header cell to the table row. + */ +function add_text_header_cell(row, text, help_topic, cls, action, colspan, is_new) { /* Newlines in text become br elements inside a span; when action is given it is attached as a click handler on the text node wrapper. */ + var node = null; + if (typeof(text) != 'undefined') { + var nbsp = (help_topic ? "\u00A0" : ""); + var str = "" + text; + var parts = str.split(/\n/); + if (parts.length === 1) { + if (action) { + node = document.createElement("span"); + node.appendChild(document.createTextNode(str + nbsp)); + } else { + node = document.createTextNode(str + nbsp); + } + } else { + node = document.createElement("span"); + for (var i = 0; i < parts.length; i++) { + if (i !== 0) { + node.appendChild(document.createElement("br")); + } + node.appendChild(document.createTextNode(parts[i])); + } + } + if (action) { + node.addEventListener("click", action, false); + node.style.cursor = "pointer"; + } + } + add_header_cell(row, node, help_topic, cls, colspan, is_new); +} + +function setup_help() { /* Initialises every element with class help that is not yet marked active. */ + "use strict"; + var help_buttons, i; + help_buttons = document.querySelectorAll(".help:not(.active)"); + for (i = 0; i < help_buttons.length; i++) { + setup_help_button(help_buttons[i]); + } +} + +function setup_scrollpad() { /* Runs only when the body has a data-scrollpad attribute and no scrollpad element exists yet. */ + "use strict"; + if (document.getElementsByTagName('body')[0].hasAttribute("data-scrollpad") && document.getElementById("scrollpad") == null) { + window.addEventListener("resize", update_scroll_pad, false); + update_scroll_pad(); + } +} + +// anon function to
avoid polluting global scope +(function() { + "use strict"; + window.addEventListener("load", function load(evt) { /* one-shot: the listener removes itself before running the setup functions */ + window.removeEventListener("load", load, false); + setup_help(); + setup_scrollpad(); + }, false); +})(); + +/* + * make_link + * + * Creates a text node and if a URL is specified it surrounds it with a link. + * If the URL doesn't contain "//" it automatically prepends "http://", as + * relative links don't make much sense in this context. + */ +function make_link(text, url) { + var textNode = null; + var link = null; + if (typeof text !== "undefined" && text !== null) textNode = document.createTextNode(text); + if (typeof url === "string") { + if (url.indexOf("//") == -1) { + url = "http://" + url; + } + link = document.createElement('a'); + link.href = url; + if (textNode) link.appendChild(textNode); + return link; + } + return textNode; +} + +// +// Function to create an HTML paragraph describing the +// MEME Suite background model source. +// +function make_background_source(title, source, text) { /* When text is truthy only the description string is returned instead of the paragraph node. */ + var paraNode = document.createElement("P"); + var titleNode = document.createElement("B"); + var textNode1 = document.createTextNode("\u00A0\u00A0\u00A0\u00A0" + title + ": "); + titleNode.appendChild(textNode1); + var source_text = ((source == "--motif--") ? "the (first) motif file" : (source == "--nrdb--") ? "an old version of the NCBI non-redundant database" : (source == "--uniform--") ? "the uniform model" : (source == "--query--") ? "the query file" : (source == "--sequences--") ? "built from the (primary) sequences" : (source == "--control--") ? "built from the control (negative) sequences" : ((source == "--negatives--") ?
"built from the negative (control) sequences" : "the file '" + source + "'")); /* any other source value is treated as a file name */ + if (text) { return source_text; } + var textNode2 = document.createTextNode(source_text); + paraNode.appendChild(titleNode); + paraNode.appendChild(textNode2); + return paraNode; +} + +// Function to create a help button +function make_help_button(container, help_topic) { + container.appendChild(help_button(help_topic)); +} + +// Function to toggle display. +function change_display(id) { /* Switches the inline display style of the element with this id between none and inline. */ + var element=document.getElementById(id); + element.style.display=(element.style.display=='none') ? element.style.display='inline' : element.style.display='none'; +} + + + + + + + + + + + + + + + + + + + + +
+

MEME results in plain text format.

+
[ + close ]
+
+
+

MEME results in XML format.

+
[ + close ]
+
+
+

Help popup.

+
[ + close ]
+
+ +
+

The statistical significance of the motif. MEME usually finds the most + statistically significant (low E-value) motifs first. It is unusual to + consider a motif with an E-value larger than 0.05 significant so, as an + additional indicator, MEME displays these greyed out.

+

The E-value of a motif is based on its log likelihood ratio, width, + sites, the background letter frequencies (given in the command line + summary), and the size of the training set.

+

The E-value is an estimate of the expected number of motifs with the + given log likelihood ratio (or higher), and with the same width and site + count, that one would find in a similarly sized set of random + sequences (sequences where each position is independent and letters are + chosen according to the background letter frequencies).

+
[ + close ]
+
+
+

The number of sites contributing to the construction of the motif.

+
[ + close ]
+
+
+

The width of the motif. Each motif describes a pattern of a fixed + width, as no gaps are allowed in MEME motifs.

+
[ + close ]
+
+
+ + +
+
+ +
[ + close ]
+
+
+

The log likelihood ratio of the motif. The log likelihood ratio is the + logarithm of the ratio of the probability of the occurrences of the motif + given the motif model (likelihood given the motif) versus their + probability given the background model (likelihood given the null model). + (Normally the background model is a 0-order Markov model using the + background letter frequencies, but higher order Markov models may be + specified via the -bfile option to MEME.)

+
[ + close ]
+
+
+

The information content of the motif in bits. It is equal to the sum + of the uncorrected information content, R(), in the columns of the motif. + This is equal to the relative entropy of the motif relative to a uniform + background frequency model.

+
[ + close ]
+
+
+

The relative entropy of the motif.

+ +

re = llr / (sites * ln(2))

+
[ + close ]
+
+
+

The Bayes Threshold.

+
[ + close ]
+
+
+

The strand used for the motif site.

+
+
+
+
The motif site was found in the sequence as it was supplied.
+
-
+
The motif site was found in the reverse complement of the supplied sequence.
+
+
[ + close ]
+
+
+

The position in the sequence where the motif site starts. If a motif + started right at the beginning of a sequence it would be described as + starting at position 1.

+
[ + close ]
+
+
+

The probability that an equal or better site would be found in a + random sequence of the same length conforming to the background letter + frequencies.

+
[ + close ]
+
+
+

A motif site with the 10 flanking letters on either side.

+

When the site is not on the given strand then the site + and both flanks are reverse complemented so they align.

+
[ + close ]
+
+ +
+

The names of the sequences as given in the FASTA file.

+

The number to the left of the sequence name is the position + of the sequence in the input sequence file.

+
[ + close ]
+
+ +
+

These are the motif sites predicted by MEME and used to build the motif.

+

These sites are shown in solid color and hovering the cursor + over a site will reveal details about the site. Only sequences + that contain a motif site are shown.

+
[ + close ]
+
+ +
+

These are the motif sites predicted by MEME plus + any additional sites detected using a motif scanning + algorithm.

+

These MEME sites are shown in solid color and + additional scanned sites are shown greyed out. + Hovering the cursor over a site will reveal details about the site. + Only sequences containing a predicted or scanned motif site are shown.

+

The scanned sites are predicted using a + log-odds scoring matrix constructed from the MEME sites. + Only scanned sites with position p-values less + than 0.0001 are shown.

+
[ + close ]
+
+ +
+

These are the same sites as shown by selecting the + "Motif Sites + Scanned Sites" button except that all + sequences, including those with no sites, are included + in the diagram.

+
[ + close ]
+
+ +
+

This is the combined match p-value.

+

The combined match p-value is defined as the probability that a + random sequence (with the same length and conforming to the background) + would have position p-values such that the product is smaller than + or equal to the value calculated for the sequence under test.

+

The position p-value is defined as the probability that a + random sequence (with the same length and conforming to the background) + would have a match to the motif under test with a score greater than or equal + to the largest found in the sequence under test.

+

Hovering your mouse over a motif site in the motif location + block diagram will show its position p-value and other information + about the site.

+
[ + close ]
+
+ +
+

Use this button to download the "Motif Locations" block diagrams + as a PDF image suitable for publication. +

+

+ Only the block diagrams currently visible in the inner scrolling + window (below) will be included in the image, and the numbers to + the left of each sequence name will not be included in the image. + You can change the size of the inner scrolling window by moving the bottom + of the main document window up and down. You can display more + diagrams by making your browser's font size smaller. +

+
[ + close ]
+
+ +
+

Use this button to download the "Motif Locations" block diagrams + as an SVG image for use in HTML documents. +

+

+ Only the block diagrams currently visible in the inner scrolling + window (below) will be included in the image, and the numbers to + the left of each sequence name will not be included in the image. + You can change the size of the inner scrolling window by moving the bottom + of the main document window up and down. You can display more + diagrams by making your browser's font size smaller. +

+
[ + close ]
+
+ +
+

+ This button will only function if your browser was + connected to the internet when you loaded this page. +

+

+ To use this button, make sure your browser is connected to the internet + and then reload this page. (You may need to do a "hard refresh" to clear the cache. + On Mac, hold down the Shift key and click the Reload button. + On Windows/Linux, hold down Ctrl and press F5.) +

+
[ + close ]
+
+ +
+

This diagram shows the location of motif sites.

+

Each block shows the position and strength of a motif + site. The height of a block gives an indication of the + significance of the site as taller blocks are more significant. + The height is calculated to be proportional to the negative + logarithm of the p-value of the site, truncated at + the height for a p-value of 1e-10.

+

For complementable alphabets (like DNA), sites on the + positive strand are shown above the line, + sites on the negative strand are shown below.

+

Placing the cursor + over a motif site will reveal more information about the site + including its position p-value. (See the help + for the p-value column for an explanation of position + p-values.)

+
[ + close ]
+
+ +
+

The name of the file(s) of sequences input to MEME.

+
[ + close ]
+
+
+

The position specific priors file used by MEME to find the motifs.

+
[ + close ]
+
+
+

The alphabet used by the sequences.

+
[ + close ]
+
+
+

The number of FASTA sequences provided in this input file.

+
[ + close ]
+
+
+

The number of characters in the sequences provided in this FASTA input file.

+
[ + close ]
+
+ +
+

The name of the alphabet symbol.

+
[ + close ]
+
+
+

The frequency of the alphabet symbol in the dataset.

+
[ + close ]
+
+
+

The frequency of the alphabet symbol as defined by the background model.

+
[ + close ]
+
+ + +
+
+
+ + +
+
+ + + +
+ + + + + +
Motif1
p-value8.23e-7
Start23
End33
+
+ +
+
Scanned Site
+ + + + + + +
Motif1
p-value8.23e-7
Start23
End33
+
+ +
+
+
+ . +
+
+
+
+
+
+ E-value: + +
+
+
+ Site Count: + +
+
+
+ Width: + +
+
+
+
+ +
+
+ StandardReverse + Complement +
+
+
+ Log Likelihood Ratio: + +
+
+
+ Information Content: + +
+
+
+ Relative Entropy: + +
+
+
+ Bayes Threshold: + +
+
+
+
+
+ +
+ + + +
+ +

+ For further information on how to interpret these results please access + https://meme-suite.org/meme/doc/meme.html.
+ To get a copy of the MEME software please access + https://meme-suite.org. +

+

+
+ +
+ Discovered Motifs +   |   + Motif Locations +   |   + Inputs & Settings +   |   + Program Information +   |   + Results in Text Format  +   |   + Results in XML Format  + +
+ + +

Your browser does not support canvas!

+ +

Discovered Motifs

+
+

Please wait... Loading...

+

If the page has fully loaded and this message does not disappear then an error may have occurred.

+
+

Motif Locations

+
+

Please wait... Loading...

+

If the page has fully loaded and this message does not disappear then an error may have occurred.

+
+

Inputs & Settings

+
+

Sequences

+ + + + + + + + + + + + + + + + + + + + + + + + + +
Role
Source
PSP Source
Alphabet
Sequence Count
Total Size
Primary Sequences
Control Sequences
+ +

Background Model

+ + + + +

Other Settings

+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +
Motif Site Distribution + ZOOPS: Zero or one site per sequence + OOPS: Exactly one site per sequence + ANR: Any number of sites per sequence +
Objective Function
Starting Point Function
Site Strand Handling + This alphabet only has one strand + Sites must be on the given strand + Sites may be on either strand +
Maximum Number of Motifs
Motif E-value Threshold
Minimum Motif Width
Maximum Motif Width
Minimum Sites per Motif
Maximum Sites per Motif
Bias on Number of Sites
Sequence Prior + Simple Dirichlet + Dirichlet Mixture + Mega-weight Dirichlet Mixture + Mega-weight Dirichlet Mixture Plus + Add One +
Sequence Prior Source
Sequence Prior Strength
EM Starting Point Source + From substrings in input sequences + From strings on command line (-cons) +
EM Starting Point Map Type + Uniform + Point Accepted Mutation +
EM Starting Point Fuzz
EM Maximum Iterations
EM Improvement Threshold
Maximum Search Size
Maximum Number of Sites for E-values
Trim Gap Open Cost
Trim Gap Extend Cost
End Gap Treatment + No cost + Same cost as other gaps +
+ + Show Advanced Settings + Hide Advanced Settings + +
+ +
+ +
+
+
MEME version
+ + (Release date: )
+
+ +
+
+
Command line
+ + +
+
+ + + diff -r 000000000000 -r 7653ebd919bb test-data/meme_output_test2.txt --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/meme_output_test2.txt Mon Jul 14 21:33:08 2025 +0000 @@ -0,0 +1,180 @@ +******************************************************************************** +MOTIF GGSRTATAAAA MEME-1 width = 11 sites = 30 llr = 254 E-value = 5.1e-040 +******************************************************************************** +-------------------------------------------------------------------------------- + Motif GGSRTATAAAA MEME-1 Description +-------------------------------------------------------------------------------- +Simplified A 3313:9:a798 +pos.-specific C 1:3::1:::1: +probability G 6756::::::2 +matrix T 1:11a1a:3:: + + bits 2.2 * + 2.0 * * + 1.8 * * + 1.5 * ** * +Relative 1.3 * ** * +Entropy 1.1 ****** +(12.2 bits) 0.9 * ******* + 0.7 * ******* + 0.4 ** ******** + 0.2 *********** + 0.0 ----------- + +Multilevel GGGGTATAAAA +consensus AACA T +sequence + +-------------------------------------------------------------------------------- + +-------------------------------------------------------------------------------- + Motif GGSRTATAAAA MEME-1 sites sorted by position p-value +-------------------------------------------------------------------------------- +Sequence name Start P-value Site +------------- ----- --------- ----------- +chr21_46046964_46047014_ 13 4.51e-07 AAGGCCAGGA GGGGTATAAAA GCCTGAGAGC +chr21_46031920_46031970_ 16 2.22e-06 ATACCCAGGG AGGGTATAAAA CCTCAGCAGC +chr21_32202076_32202126_ 14 2.74e-06 CCACCAGCTT GAGGTATAAAA AGCCCTGTAC +chr21_46057197_46057247_ 37 4.86e-06 ACAGGCCCTG GGCATATAAAA GCC +chr21_45993530_45993580_ 8 4.86e-06 CCAAGGA GGAGTATAAAA GCCCCACAAA +chr21_45971413_45971463_ 10 4.86e-06 CAGGCCCTG GGCATATAAAA GCCCCAGCAG +chr21_31964683_31964733_ 14 4.86e-06 GATTCACTGA GGCATATAAAA GGCCCTCTGC +chr21_47517957_47518007_ 33 6.48e-06 CCGGCGGGGC GGGGTATAAAG GGGGCGG +chr21_45978668_45978718_ 5 6.48e-06 CAGA GGGGTATAAAG 
GTTCCGACCA +chr21_32185595_32185645_ 19 6.48e-06 CACCAGAGCT GGGATATATAA AGAAGGTTCT +chr21_32410820_32410870_ 22 1.38e-05 AATCACTGAG GATGTATAAAA GTCCCAGGGA +chr21_31992870_31992920_ 17 1.38e-05 CACTATTGAA GATGTATAAAA TTTCATTTGC +chr21_19617074_19617124_ 40 1.41e-05 CCTCGGGACG TGGGTATATAA +chr21_31914206_31914256_ 16 1.61e-05 CCCACTACTT AGAGTATAAAA TCATTCTGAG +chr21_46020421_46020471_ 3 1.95e-05 GA GACATATAAAA GCCAACATCC +chr21_32253899_32253949_ 18 1.95e-05 CCCACCAGCA AGGATATATAA AAGCTCAGGA +chr21_45705687_45705737_ 38 2.16e-05 CGTGGTCGCG GGGGTATAACA GC +chr21_47575506_47575556_ 31 3.04e-05 GCTGCCGGTG AGCGTATAAAG GCCCTGGCG +chr21_31744582_31744632_ 13 3.04e-05 CAGGTCTAAG AGCATATATAA CTTGGAGTCC +chr21_31768316_31768366_ 1 3.67e-05 . AACGTATATAA ATGGTCCTGT +chr21_26934381_26934431_ 28 3.93e-05 AGTCACAAGT GAGTTATAAAA GGGTCGCACG +chr21_31933633_31933683_ 5 5.65e-05 TCAG AGTATATATAA ATGTTCCTGT +chr21_31710037_31710087_ 15 6.24e-05 CCCAGGTTTC TGAGTATATAA TCGCCGCACC +chr21_36411748_36411798_ 23 7.15e-05 AGTTTCAGTT GGCATCtaaaa attatataac +chr21_46102103_46102153_ 37 1.39e-04 TGCCTGGGTC CAGGTATAAAG GCT +chr21_46086869_46086919_ 38 1.39e-04 TGCCTGGGCC CAGGTATAAAG GC +chr21_37838750_37838800_ 3 4.81e-04 ga tggttttataa ggggcctcac +chr21_31962741_31962791_ 14 8.57e-04 TATAACTCAG GTTGGATAAAA TAATTTGTAC +chr21_31973364_31973414_ 8 1.47e-03 aaactta aaactctataa acttaaaact +chr21_28217753_28217803_ 27 2.64e-03 GGTGGGGGTG GGGGTTTCACT GGTCCACTAT +-------------------------------------------------------------------------------- + +-------------------------------------------------------------------------------- + Motif GGSRTATAAAA MEME-1 block diagrams +-------------------------------------------------------------------------------- +SEQUENCE NAME POSITION P-VALUE MOTIF DIAGRAM +------------- ---------------- ------------- +chr21_46046964_46047014_ 4.5e-07 12_[+1]_27 +chr21_46031920_46031970_ 2.2e-06 15_[+1]_24 +chr21_32202076_32202126_ 2.7e-06 13_[+1]_26 +chr21_46057197_46057247_ 4.9e-06 
36_[+1]_3 +chr21_45993530_45993580_ 4.9e-06 7_[+1]_32 +chr21_45971413_45971463_ 4.9e-06 9_[+1]_30 +chr21_31964683_31964733_ 4.9e-06 13_[+1]_26 +chr21_47517957_47518007_ 6.5e-06 32_[+1]_7 +chr21_45978668_45978718_ 6.5e-06 4_[+1]_35 +chr21_32185595_32185645_ 6.5e-06 18_[+1]_21 +chr21_32410820_32410870_ 1.4e-05 21_[+1]_18 +chr21_31992870_31992920_ 1.4e-05 16_[+1]_23 +chr21_19617074_19617124_ 1.4e-05 39_[+1] +chr21_31914206_31914256_ 1.6e-05 15_[+1]_24 +chr21_46020421_46020471_ 1.9e-05 2_[+1]_37 +chr21_32253899_32253949_ 1.9e-05 17_[+1]_22 +chr21_45705687_45705737_ 2.2e-05 37_[+1]_2 +chr21_47575506_47575556_ 3e-05 30_[+1]_9 +chr21_31744582_31744632_ 3e-05 12_[+1]_27 +chr21_31768316_31768366_ 3.7e-05 [+1]_39 +chr21_26934381_26934431_ 3.9e-05 27_[+1]_12 +chr21_31933633_31933683_ 5.6e-05 4_[+1]_35 +chr21_31710037_31710087_ 6.2e-05 14_[+1]_25 +chr21_36411748_36411798_ 7.1e-05 22_[+1]_17 +chr21_46102103_46102153_ 0.00014 36_[+1]_3 +chr21_46086869_46086919_ 0.00014 37_[+1]_2 +chr21_37838750_37838800_ 0.00048 2_[+1]_37 +chr21_31962741_31962791_ 0.00086 13_[+1]_26 +chr21_31973364_31973414_ 0.0015 7_[+1]_32 +chr21_28217753_28217803_ 0.0026 26_[+1]_13 +-------------------------------------------------------------------------------- + +-------------------------------------------------------------------------------- + Motif GGSRTATAAAA MEME-1 in BLOCKS format +-------------------------------------------------------------------------------- +BL MOTIF GGSRTATAAAA width=11 seqs=30 +chr21_46046964_46047014_ ( 13) GGGGTATAAAA 1 +chr21_46031920_46031970_ ( 16) AGGGTATAAAA 1 +chr21_32202076_32202126_ ( 14) GAGGTATAAAA 1 +chr21_46057197_46057247_ ( 37) GGCATATAAAA 1 +chr21_45993530_45993580_ ( 8) GGAGTATAAAA 1 +chr21_45971413_45971463_ ( 10) GGCATATAAAA 1 +chr21_31964683_31964733_ ( 14) GGCATATAAAA 1 +chr21_47517957_47518007_ ( 33) GGGGTATAAAG 1 +chr21_45978668_45978718_ ( 5) GGGGTATAAAG 1 +chr21_32185595_32185645_ ( 19) GGGATATATAA 1 +chr21_32410820_32410870_ ( 22) GATGTATAAAA 1 
+chr21_31992870_31992920_ ( 17) GATGTATAAAA 1 +chr21_19617074_19617124_ ( 40) TGGGTATATAA 1 +chr21_31914206_31914256_ ( 16) AGAGTATAAAA 1 +chr21_46020421_46020471_ ( 3) GACATATAAAA 1 +chr21_32253899_32253949_ ( 18) AGGATATATAA 1 +chr21_45705687_45705737_ ( 38) GGGGTATAACA 1 +chr21_47575506_47575556_ ( 31) AGCGTATAAAG 1 +chr21_31744582_31744632_ ( 13) AGCATATATAA 1 +chr21_31768316_31768366_ ( 1) AACGTATATAA 1 +chr21_26934381_26934431_ ( 28) GAGTTATAAAA 1 +chr21_31933633_31933683_ ( 5) AGTATATATAA 1 +chr21_31710037_31710087_ ( 15) TGAGTATATAA 1 +chr21_36411748_36411798_ ( 23) GGCATCTAAAA 1 +chr21_46102103_46102153_ ( 37) CAGGTATAAAG 1 +chr21_46086869_46086919_ ( 38) CAGGTATAAAG 1 +chr21_37838750_37838800_ ( 3) TGGTTTTATAA 1 +chr21_31962741_31962791_ ( 14) GTTGGATAAAA 1 +chr21_31973364_31973414_ ( 8) AAACTCTATAA 1 +chr21_28217753_28217803_ ( 27) GGGGTTTCACT 1 +// + +-------------------------------------------------------------------------------- + +-------------------------------------------------------------------------------- + Motif GGSRTATAAAA MEME-1 position-specific scoring matrix +-------------------------------------------------------------------------------- +log-odds matrix: alength= 4 w= 11 n= 1200 bayes= 5.2854 E= 5.1e-040 + -14 -179 114 -112 + 3 -1155 137 -270 + -114 20 86 -71 + 3 -279 122 -170 + -1155 -1155 -295 215 + 156 -179 -1155 -170 + -1155 -1155 -1155 220 + 172 -279 -1155 -1155 + 125 -1155 -1155 46 + 167 -179 -1155 -1155 + 144 -1155 -63 -270 +-------------------------------------------------------------------------------- + +-------------------------------------------------------------------------------- + Motif GGSRTATAAAA MEME-1 position-specific probability matrix +-------------------------------------------------------------------------------- +letter-probability matrix: alength= 4 w= 11 nsites= 30 E= 5.1e-040 + 0.266667 0.066667 0.566667 0.100000 + 0.300000 0.000000 0.666667 0.033333 + 0.133333 0.266667 0.466667 0.133333 + 0.300000 0.033333 
0.600000 0.066667 + 0.000000 0.000000 0.033333 0.966667 + 0.866667 0.066667 0.000000 0.066667 + 0.000000 0.000000 0.000000 1.000000 + 0.966667 0.033333 0.000000 0.000000 + 0.700000 0.000000 0.000000 0.300000 + 0.933333 0.066667 0.000000 0.000000 + 0.800000 0.000000 0.166667 0.033333 +-------------------------------------------------------------------------------- + +-------------------------------------------------------------------------------- + Motif GGSRTATAAAA MEME-1 regular expression +-------------------------------------------------------------------------------- +[GA][GA][GC][GA]TATA[AT]AA +-------------------------------------------------------------------------------- \ No newline at end of file diff -r 000000000000 -r 7653ebd919bb test-data/meme_output_test2.xml --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/meme_output_test2.xml Mon Jul 14 21:33:08 2025 +0000 @@ -0,0 +1,713 @@ + + +-14 +-179 +114 +-112 + + +3 +-1155 +137 +-270 + + +-114 +20 +86 +-71 + + +3 +-279 +122 +-170 + + +-1155 +-1155 +-295 +215 + + +156 +-179 +-1155 +-170 + + +-1155 +-1155 +-1155 +220 + + +172 +-279 +-1155 +-1155 + + +125 +-1155 +-1155 +46 + + +167 +-179 +-1155 +-1155 + + +144 +-1155 +-63 +-270 + + + + + + +0.266667 +0.066667 +0.566667 +0.100000 + + +0.300000 +0.000000 +0.666667 +0.033333 + + +0.133333 +0.266667 +0.466667 +0.133333 + + +0.300000 +0.033333 +0.600000 +0.066667 + + +0.000000 +0.000000 +0.033333 +0.966667 + + +0.866667 +0.066667 +0.000000 +0.066667 + + +0.000000 +0.000000 +0.000000 +1.000000 + + +0.966667 +0.033333 +0.000000 +0.000000 + + +0.700000 +0.000000 +0.000000 +0.300000 + + +0.933333 +0.066667 +0.000000 +0.000000 + + +0.800000 +0.000000 +0.166667 +0.033333 + + + + +[GA][GA][GC][GA]TATA[AT]AA + + + +AAGGCCAGGA + + + + + + + + + + + + + +GCCTGAGAGC + + +ATACCCAGGG + + + + + + + + + + + + + +CCTCAGCAGC + + +CCACCAGCTT + + + + + + + + + + + + + +AGCCCTGTAC + + +ACAGGCCCTG + + + + + + + + + + + + + +GCC + + +CCAAGGA + + + + + + + + + + + + + 
+GCCCCACAAA + + +CAGGCCCTG + + + + + + + + + + + + + +GCCCCAGCAG + + +GATTCACTGA + + + + + + + + + + + + + +GGCCCTCTGC + + +CCGGCGGGGC + + + + + + + + + + + + + +GGGGCGG + + +CAGA + + + + + + + + + + + + + +GTTCCGACCA + + +CACCAGAGCT + + + + + + + + + + + + + +AGAAGGTTCT + + +AATCACTGAG + + + + + + + + + + + + + +GTCCCAGGGA + + +CACTATTGAA + + + + + + + + + + + + + +TTTCATTTGC + + +CCTCGGGACG + + + + + + + + + + + + + + + + +CCCACTACTT + + + + + + + + + + + + + +TCATTCTGAG + + +GA + + + + + + + + + + + + + +GCCAACATCC + + +CCCACCAGCA + + + + + + + + + + + + + +AAGCTCAGGA + + +CGTGGTCGCG + + + + + + + + + + + + + +GC + + +GCTGCCGGTG + + + + + + + + + + + + + +GCCCTGGCG + + +CAGGTCTAAG + + + + + + + + + + + + + +CTTGGAGTCC + + + + + + + + + + + + + + + + +ATGGTCCTGT + + +AGTCACAAGT + + + + + + + + + + + + + +GGGTCGCACG + + +TCAG + + + + + + + + + + + + + +ATGTTCCTGT + + +CCCAGGTTTC + + + + + + + + + + + + + +TCGCCGCACC + + +AGTTTCAGTT + + + + + + + + + + + + + +attatataac + + +TGCCTGGGTC + + + + + + + + + + + + + +GCT + + +TGCCTGGGCC + + + + + + + + + + + + + +GC + + +ga + + + + + + + + + + + + + +ggggcctcac + + +TATAACTCAG + + + + + + + + + + + + + +TAATTTGTAC + + +aaactta + + + + + + + + + + + + + +acttaaaact + + +GGTGGGGGTG + + + + + + + + + + + + + +GGTCCACTAT + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + diff -r 000000000000 -r 7653ebd919bb test-data/meme_psp_output_test1.memepsp --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/meme_psp_output_test1.memepsp Mon Jul 14 21:33:08 2025 +0000 @@ -0,0 +1,6 @@ +>BBP_PIEBR 20 scaledmin = 0.1 scaledmax = 0.9 +0.006488825 0.006488825 0.006488825 0.006488825 0.006488825 0.006488825 0.006488825 0.006488825 0.006488825 0.006488825 0.006488825 0.006488825 0.006488825 0.006488825 0.006488825 0.006488825 0.006488825 0.006488825 0.006488825 0.006488825 0.006488825 0.006488825 0.006488825 0.006488825 0.006488825 0.006488825 0.006488825 
0.006488825 0.006488825 0.006488825 0.006488825 0.006488825 0.006488825 0.006488825 0.006488825 0.006488825 0.006488825 0.006488825 0.006488825 0.006488825 0.006488825 0.006488825 0.006488825 0.006488825 0.006488825 0.006488825 0.006488825 0.006488825 0.006488825 0.006488825 0.006488825 0.006488825 0.006488825 0.006488825 0.006488825 0.006488825 0.006488825 0.006488825 0.006488825 0.006488825 0.006488825 0.006488825 0.006488825 0.006488825 0.006488825 0.006488825 0.006488825 0.006488825 0.006488825 0.006488825 0.006488825 0.006488825 0.006488825 0.006488825 0.006488825 0.006488825 0.006488825 0.006488825 0.006488825 0.006488825 0.006488825 0.006488825 0.006488825 0.006488825 0.006488825 0.006488825 0.006488825 0.006488825 0.006488825 0.006488825 0.006488825 0.006488825 0.006488825 0.006488825 0.006488825 0.006488825 0.006488825 0.006488825 0.006488825 0.006488825 0.006488825 0.006488825 0.006488825 0.006488825 0.006488825 0.006488825 0.006488825 0.006488825 0.006488825 0.006488825 0.006488825 0.006488825 0.006488825 0.006488825 0.006488825 0.006488825 0.006488825 0.006488825 0.006488825 0.006488825 0.006488825 0.006488825 0.006488825 0.006488825 0.006488825 0.006488825 0.006488825 0.006488825 0.006488825 0.006488825 0.006488825 0.006488825 0.006488825 0.006488825 0.006488825 0.006488825 0.006488825 0.006488825 0.006488825 0.006488825 0.006488825 0.006488825 0.006488825 0.006488825 0.006488825 0.006488825 0.006488825 0.006488825 0.006488825 0.006488825 0.006488825 0.006488825 0.006488825 0.006488825 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 +>ICYA_MANSE 20 scaledmin = 0.1 scaledmax = 0.9 +0.005878511 0.005878511 0.005878511 0.005878511 0.005878511 0.005878511 0.005878511 0.005878511 0.005878511 0.005878511 0.005878511 0.005878511 0.005878511 0.005878511 0.005878511 0.005878511 0.005878511 0.005878511 0.005878511 0.005878511 0.005878511 0.005878511 0.005878511 0.005878511 0.005878511 0.005878511 0.005878511 0.005878511 0.005878511 0.005878511 0.005878511 0.005878511 
0.005878511 0.005878511 0.005878511 0.005878511 0.005878511 0.005878511 0.005878511 0.005878511 0.005878511 0.005878511 0.005878511 0.005878511 0.005878511 0.005878511 0.005878511 0.005878511 0.005878511 0.005878511 0.005878511 0.005878511 0.005878511 0.005878511 0.005878511 0.005878511 0.005878511 0.005878511 0.005878511 0.005878511 0.005878511 0.005878511 0.005878511 0.005878511 0.005878511 0.005878511 0.005878511 0.005878511 0.005878511 0.005878511 0.005878511 0.005878511 0.005878511 0.005878511 0.005878511 0.005878511 0.005878511 0.005878511 0.005878511 0.005878511 0.005878511 0.005878511 0.005878511 0.005878511 0.005878511 0.005878511 0.005878511 0.005878511 0.005878511 0.005878511 0.005878511 0.005878511 0.005878511 0.005878511 0.005878511 0.005878511 0.005878511 0.005878511 0.005878511 0.005878511 0.005878511 0.005878511 0.005878511 0.005878511 0.005878511 0.005878511 0.005878511 0.005878511 0.005878511 0.005878511 0.005878511 0.005878511 0.005878511 0.005878511 0.005878511 0.005878511 0.005878511 0.005878511 0.005878511 0.005878511 0.005878511 0.005878511 0.005878511 0.005878511 0.005878511 0.005878511 0.005878511 0.005878511 0.005878511 0.005878511 0.005878511 0.005878511 0.005878511 0.005878511 0.005878511 0.005878511 0.005878511 0.005878511 0.005878511 0.005878511 0.005878511 0.005878511 0.005878511 0.005878511 0.005878511 0.005878511 0.005878511 0.005878511 0.005878511 0.005878511 0.005878511 0.005878511 0.005878511 0.005878511 0.005878511 0.005878511 0.005878511 0.005878511 0.005878511 0.005878511 0.005878511 0.005878511 0.005878511 0.005878511 0.005878511 0.005878511 0.005878511 0.005878511 0.005878511 0.005878511 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 +>LACB_BOVIN 20 scaledmin = 0.1 scaledmax = 0.9 +0.006284916 0.006284916 0.006284916 0.006284916 0.006284916 0.006284916 0.006284916 0.006284916 0.006284916 0.006284916 0.006284916 0.006284916 0.006284916 0.006284916 0.006284916 0.006284916 0.006284916 0.006284916 0.006284916 0.006284916 0.006284916 
0.006284916 0.006284916 0.006284916 0.006284916 0.006284916 0.006284916 0.006284916 0.006284916 0.006284916 0.006284916 0.006284916 0.006284916 0.006284916 0.006284916 0.006284916 0.006284916 0.006284916 0.006284916 0.006284916 0.006284916 0.006284916 0.006284916 0.006284916 0.006284916 0.006284916 0.006284916 0.006284916 0.006284916 0.006284916 0.006284916 0.006284916 0.006284916 0.006284916 0.006284916 0.006284916 0.006284916 0.006284916 0.006284916 0.006284916 0.006284916 0.006284916 0.006284916 0.006284916 0.006284916 0.006284916 0.006284916 0.006284916 0.006284916 0.006284916 0.006284916 0.006284916 0.006284916 0.006284916 0.006284916 0.006284916 0.006284916 0.006284916 0.006284916 0.006284916 0.006284916 0.006284916 0.006284916 0.006284916 0.006284916 0.006284916 0.006284916 0.006284916 0.006284916 0.006284916 0.006284916 0.006284916 0.006284916 0.006284916 0.006284916 0.006284916 0.006284916 0.006284916 0.006284916 0.006284916 0.006284916 0.006284916 0.006284916 0.006284916 0.006284916 0.006284916 0.006284916 0.006284916 0.006284916 0.006284916 0.006284916 0.006284916 0.006284916 0.006284916 0.006284916 0.006284916 0.006284916 0.006284916 0.006284916 0.006284916 0.006284916 0.006284916 0.006284916 0.006284916 0.006284916 0.006284916 0.006284916 0.006284916 0.006284916 0.006284916 0.006284916 0.006284916 0.006284916 0.006284916 0.006284916 0.006284916 0.006284916 0.006284916 0.006284916 0.006284916 0.006284916 0.006284916 0.006284916 0.006284916 0.006284916 0.006284916 0.006284916 0.006284916 0.006284916 0.006284916 0.006284916 0.006284916 0.006284916 0.006284916 0.006284916 0.006284916 0.006284916 0.006284916 0.006284916 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 diff -r 000000000000 -r 7653ebd919bb test-data/meme_psp_output_test1.tabular --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/meme_psp_output_test1.tabular Mon Jul 14 21:33:08 2025 +0000 @@ -0,0 +1,21 @@ +meme_psp_input_pos.fa: 540 bases or amino acids +meme_psp_input_neg.fa: 540 bases or 
amino acids +meme_psp_input_pos.fa meme_psp_input_neg.fa 0.5 0.5 4 4 +meme_psp_input_pos.fa meme_psp_input_neg.fa 0.5 0.5 5 5 +meme_psp_input_pos.fa meme_psp_input_neg.fa 0.5 0.5 6 6 +meme_psp_input_pos.fa meme_psp_input_neg.fa 0.5 0.5 7 7 +meme_psp_input_pos.fa meme_psp_input_neg.fa 0.5 0.5 8 8 +meme_psp_input_pos.fa meme_psp_input_neg.fa 0.5 0.5 9 9 +meme_psp_input_pos.fa meme_psp_input_neg.fa 0.5 0.5 10 10 +meme_psp_input_pos.fa meme_psp_input_neg.fa 0.5 0.5 11 11 +meme_psp_input_pos.fa meme_psp_input_neg.fa 0.5 0.5 12 12 +meme_psp_input_pos.fa meme_psp_input_neg.fa 0.5 0.5 13 13 +meme_psp_input_pos.fa meme_psp_input_neg.fa 0.5 0.5 14 14 +meme_psp_input_pos.fa meme_psp_input_neg.fa 0.5 0.5 15 15 +meme_psp_input_pos.fa meme_psp_input_neg.fa 0.5 0.5 16 16 +meme_psp_input_pos.fa meme_psp_input_neg.fa 0.5 0.5 17 17 +meme_psp_input_pos.fa meme_psp_input_neg.fa 0.5 0.5 18 18 +meme_psp_input_pos.fa meme_psp_input_neg.fa 0.5 0.5 19 19 +meme_psp_input_pos.fa meme_psp_input_neg.fa 0.5 0.5 20 20 + +score 0.9 occurred 483 times diff -r 000000000000 -r 7653ebd919bb test-data/meme_psp_protein_input.fasta --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/meme_psp_protein_input.fasta Mon Jul 14 21:33:08 2025 +0000 @@ -0,0 +1,15 @@ +>ICYA_MANSE +GDIFYPGYCPDVKPVNDFDLSAFAGAWHEIAKLPLENENQGKCTIAEYKY +DGKKASVYNSFVSNGVKEYMEGDLEIAPDAKYTKQGKYVMTFKFGQRVVN +LVPWVLATDYKNYAINYNCDYHPDKKAHSIHAWILSKSKVLEGNTKEVVD +NVLKTFSHLIDASKFISNDFSEAACQYSTTYSLTGPDRH +>LACB_BOVIN +MKCLLLALALTCGAQALIVTQTMKGLDIQKVAGTWYSLAMAASDISLLDA +QSAPLRVYVEELKPTPEGDLEILLQKWENGECAQKKIIAEKTKIPAVFKI +DALNENKVLVLDTDYKKYLLFCMENSAEPEQSLACQCLVRTPEVDDEALE +KFDKALKALPMHIRLSFNPTQLEEQCHI +>BBP_PIEBR +NVYHDGACPEVKPVDNFDWSNYHGKWWEVAKYPNSVEKYGKCGWAEYTPE +GKSVKVSNYHVIHGKEYFIEGTAYPVGDSKIGKIYHKLTYGGVTKENVFN +VLSTDNKNYIIGYYCKYDEDKKGHQDFVWVLSRSKVLTGEAKTAVENYLI +GSPVVDSQKLVYSDFSEAACKVN diff -r 000000000000 -r 7653ebd919bb test-data/prior30.plib --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/prior30.plib Mon Jul 14 
21:33:08 2025 +0000 @@ -0,0 +1,275 @@ +Alphabet= ACDEFGHIKLMNPQRSTVWY +NumDistr= 30 +Number= 0 +Mixture= 0.055795 +B= 5.623820 +Alpha= 0.0855491 0.0221831 0.0111063 0.0209959 0.0505726 0.025437 0.0155389 0.132951 0.0247865 0.150287 0.0577239 0.0209317 0.0166629 0.0220905 0.0244295 0.0497608 0.070277 0.157532 0.0102219 0.0309633 +FullUpdate= 1 +QUpdate= 1 +StructID= 0 +Comment= HMM9.4 reestimated in henikoff29.2 + +Number= 1 +Mixture= 0.198333 +B= 0.097240 +Alpha= 0.0562629 0.0329597 0.0692513 0.0385232 0.0400041 0.143573 0.0428939 0.0226244 0.0442102 0.0665467 0.0117853 0.0447655 0.0833299 0.0395825 0.0611271 0.0588852 0.0513472 0.0317153 0.0237865 0.0368161 +FullUpdate= 1 +QUpdate= 1 +StructID= 24 +Comment= Outside + +Number= 2 +Mixture= 0.043566 +B= 1.648336 +Alpha= 0.0144564 0.00845337 0.00785519 0.00864933 0.255959 0.0110815 0.0509526 0.0234533 0.0120443 0.0561967 0.015111 0.0190974 0.00857653 0.0167812 0.0164918 0.0197108 0.0151013 0.0252782 0.050139 0.364613 +FullUpdate= 1 +QUpdate= 1 +StructID= 26 +Comment= Inside + +Number= 3 +Mixture= 0.060170 +B= 2.595432 +Alpha= 0.0452144 0.00587917 0.169731 0.0751478 0.00749471 0.0845832 0.0369819 0.00610072 0.0548186 0.011029 0.00382749 0.212785 0.0206532 0.0416705 0.0280716 0.117267 0.0533742 0.00943157 0.00216149 0.0137784 +FullUpdate= 1 +QUpdate= 1 +StructID= 19 +Comment= Outside Alpha + +Number= 4 +Mixture= 0.065466 +B= 3.112271 +Alpha= 0.0361167 0.0049157 0.0134924 0.0461325 0.00557631 0.0209043 0.0302551 0.016425 0.307554 0.0338255 0.0139435 0.0360733 0.0127659 0.0873761 0.222668 0.0369042 0.0354442 0.0228891 0.00434827 0.0123906 +FullUpdate= 1 +QUpdate= 1 +StructID= 21 +Comment= Outside Beta + +Number= 5 +Mixture= 0.067614 +B= 2.053644 +Alpha= 0.0194362 0.00765176 0.00188738 0.00372898 0.0849894 0.00421787 0.00400459 0.152735 0.00407958 0.4568 0.106051 0.00304386 0.00545956 0.00900935 0.00605071 0.00519029 0.016255 0.0861045 0.00787965 0.0154248 +FullUpdate= 1 +QUpdate= 1 +StructID= 22 +Comment= Inside alpha + 
+Number= 6 +Mixture= 0.080724 +B= 2.138987 +Alpha= 0.0423172 0.0153891 0.00409306 0.00565735 0.0197117 0.00590607 0.00139926 0.307863 0.00544884 0.115721 0.0285808 0.00522771 0.00474851 0.00328193 0.00351054 0.00892385 0.0348922 0.380003 0.00117673 0.00614917 +FullUpdate= 1 +QUpdate= 1 +StructID= 23 +Comment= Inside beta + +Number= 7 +Mixture= 0.051030 +B= 3.878926 +Alpha= 0.0548123 0.000759746 0.144127 0.46019 0.00249502 0.0192754 0.0106535 0.00938765 0.0562429 0.0163148 0.00717389 0.0245612 0.0177482 0.0744802 0.0199233 0.0323535 0.0257651 0.018574 0.00087086 0.00429088 +FullUpdate= 1 +QUpdate= 1 +StructID= 23 +Comment= Alpha helix + +Number= 8 +Mixture= 0.103529 +B= 1.486325 +Alpha= 0.315754 0.0384546 0.0116388 0.0133665 0.0111126 0.107921 0.00752325 0.0154885 0.0111281 0.0231087 0.011626 0.0228375 0.0304785 0.0166632 0.0156345 0.186379 0.0954421 0.0546691 0.00351538 0.00725682 +FullUpdate= 1 +QUpdate= 1 +StructID= 23 +Comment= Beta strand + +Number= 9 +Mixture= 0.062940 +B= 8.221215 +Alpha= 0.0869919 0.00672577 0.0600995 0.10763 0.0153489 0.0378086 0.0325335 0.023388 0.113765 0.041623 0.0196906 0.0625344 0.0262599 0.0788667 0.0707399 0.0886634 0.0666777 0.0361472 0.00484308 0.0196629 +FullUpdate= 1 +QUpdate= 1 +StructID= 23 +Comment= Other + +Number= 10 +Mixture= 0.012518 +B= 38.955631 +Alpha= 0.732922 0.0145131 0.00623235 0.00951423 0.00717778 0.0289521 0.00351664 0.0125081 0.00886593 0.0183651 0.00832812 0.00670968 0.00364556 0.00622169 0.00812899 0.0582399 0.0205067 0.0394327 0.00207485 0.00414489 +FullUpdate= 1 +QUpdate= 1 +StructID= 0 +Comment= A + +Number= 11 +Mixture= 0.004953 +B= 381.562195 +Alpha= 0.00563239 0.959814 0.00144129 0.00213042 0.00158645 0.00168393 0.000989765 0.00325263 0.00148501 0.00343924 0.00168673 0.00159054 0.00121534 0.00129942 0.00195209 0.00296106 0.0039912 0.00266944 0.000327808 0.000851203 +FullUpdate= 1 +QUpdate= 1 +StructID= 0 +Comment= C + +Number= 12 +Mixture= 0.013849 +B= 90.727570 +Alpha= 0.00897115 0.00169015 0.859473 
0.0360829 0.00269485 0.00606504 0.00469816 0.00400134 0.0047981 0.00514968 0.00208395 0.029754 0.00241276 0.0045506 0.00433816 0.0088208 0.00511143 0.00527448 0.00104469 0.00298475 +FullUpdate= 1 +QUpdate= 1 +StructID= 0 +Comment= D + +Number= 13 +Mixture= 0.008388 +B= 404.591034 +Alpha= 0.00241514 0.000413991 0.0122981 0.96369 0.000665578 0.00187461 0.00106904 0.00149214 0.00121548 0.00129791 0.000554145 0.00253496 0.000624495 0.00316839 0.00115045 0.00171781 0.001468 0.0014564 0.000278652 0.000614791 +FullUpdate= 1 +QUpdate= 1 +StructID= 0 +Comment= E + +Number= 14 +Mixture= 0.008064 +B= 83.323669 +Alpha= 0.00839779 0.00428348 0.00298116 0.00358128 0.850936 0.00329382 0.00196832 0.0130534 0.00320345 0.0351883 0.00729724 0.00287304 0.00358482 0.00218728 0.00264753 0.00833798 0.00418729 0.0120684 0.00448366 0.025446 +FullUpdate= 1 +QUpdate= 1 +StructID= 0 +Comment= F + +Number= 15 +Mixture= 0.032205 +B= 32.644871 +Alpha= 0.0234448 0.00236512 0.0112957 0.00811395 0.00248143 0.868718 0.00345598 0.00342985 0.00859682 0.0040966 0.00239339 0.012342 0.00423123 0.00440054 0.00795347 0.0165095 0.0065024 0.00550512 0.00140604 0.00275817 +FullUpdate= 1 +QUpdate= 1 +StructID= 0 +Comment= G + +Number= 16 +Mixture= 0.005033 +B= 35.520824 +Alpha= 0.0100058 0.00386024 0.0131498 0.0108984 0.0122851 0.00738691 0.722249 0.00521193 0.00686054 0.0150103 0.00673014 0.0367074 0.00625526 0.0429912 0.0234127 0.0187246 0.0128445 0.00837399 0.00390723 0.0331349 +FullUpdate= 1 +QUpdate= 1 +StructID= 0 +Comment= H + +Number= 17 +Mixture= 0.007454 +B= 101.265472 +Alpha= 0.0106938 0.00267663 0.00404166 0.00466637 0.00838963 0.00372808 0.00182575 0.681615 0.0059102 0.0770333 0.0184335 0.004676 0.0027124 0.00372663 0.00418165 0.00773357 0.0109237 0.140679 0.00140417 0.00494911 +FullUpdate= 1 +QUpdate= 1 +StructID= 0 +Comment= I + +Number= 18 +Mixture= 0.009400 +B= 150.415985 +Alpha= 0.00688657 0.00169711 0.00222738 0.00346887 0.00115861 0.00302866 0.00209171 0.00400905 0.903944 0.0037747 
0.00186061 0.00449531 0.00249618 0.00324487 0.041775 0.00392196 0.00461714 0.00296607 0.000893256 0.00144282 +FullUpdate= 1 +QUpdate= 1 +StructID= 0 +Comment= K + +Number= 19 +Mixture= 0.017057 +B= 31.896633 +Alpha= 0.0114646 0.00367926 0.00296188 0.00596126 0.0190009 0.00382486 0.00338381 0.0401936 0.00650072 0.790038 0.031659 0.00392791 0.0050046 0.00753591 0.00771818 0.00748621 0.0101555 0.0312597 0.00242405 0.00581952 +FullUpdate= 1 +QUpdate= 1 +StructID= 0 +Comment= L + +Number= 20 +Mixture= 0.002761 +B= 201.346268 +Alpha= 0.00353933 0.00165628 0.0014931 0.00161065 0.00279831 0.00194259 0.00101868 0.00969101 0.00211316 0.0217036 0.928022 0.00162899 0.0015681 0.0015629 0.00138977 0.00294601 0.00311476 0.00723178 0.00156295 0.00340569 +FullUpdate= 1 +QUpdate= 1 +StructID= 0 +Comment= M + +Number= 21 +Mixture= 0.005734 +B= 108.343185 +Alpha= 0.0067512 0.00239062 0.0140378 0.0043452 0.00365788 0.00689345 0.0148828 0.00715373 0.00789036 0.00614036 0.00289697 0.858995 0.00399721 0.00770961 0.00570515 0.0238176 0.011602 0.00591549 0.00167893 0.00353897 +FullUpdate= 1 +QUpdate= 1 +StructID= 0 +Comment= N + +Number= 22 +Mixture= 0.022818 +B= 15.153304 +Alpha= 0.0417987 0.00360232 0.0113792 0.0152366 0.00564775 0.0123795 0.00606957 0.0091353 0.0165122 0.0167265 0.00490487 0.00915437 0.755604 0.0131375 0.012587 0.0283392 0.0189623 0.0140029 0.0012848 0.00353553 +FullUpdate= 1 +QUpdate= 1 +StructID= 0 +Comment= P + +Number= 23 +Mixture= 0.005931 +B= 79.417511 +Alpha= 0.0142993 0.00266984 0.0053289 0.0321605 0.0028715 0.00426743 0.0257509 0.00565307 0.0106106 0.0161186 0.00955753 0.0104696 0.00638107 0.807311 0.0149106 0.0111968 0.00889459 0.00681482 0.00206658 0.00266624 +FullUpdate= 1 +QUpdate= 1 +StructID= 0 +Comment= Q + +Number= 24 +Mixture= 0.011491 +B= 93.103897 +Alpha= 0.00756896 0.00314197 0.00296652 0.00327634 0.00194604 0.00467894 0.00721049 0.00406061 0.0277257 0.00663852 0.00217868 0.00577047 0.00473306 0.00953551 0.889701 0.00650859 0.00506022 0.00294281 
0.00205549 0.00230062 +FullUpdate= 1 +QUpdate= 1 +StructID= 0 +Comment= R + +Number= 25 +Mixture= 0.008219 +B= 47.504795 +Alpha= 0.0284818 0.00697155 0.00749796 0.00604665 0.00515171 0.00954817 0.00380684 0.00637929 0.0104463 0.00908885 0.00471437 0.0194592 0.00711823 0.00611827 0.00979722 0.707416 0.139256 0.00656298 0.0015377 0.00460086 +FullUpdate= 1 +QUpdate= 1 +StructID= 0 +Comment= S + +Number= 26 +Mixture= 0.019050 +B= 14.027470 +Alpha= 0.0247201 0.00718027 0.00845584 0.0076239 0.00600101 0.0073401 0.00492149 0.0173757 0.0129878 0.0125773 0.0100452 0.0230424 0.00659406 0.0110314 0.0112037 0.107763 0.690341 0.0249364 0.00193884 0.00392074 +FullUpdate= 1 +QUpdate= 1 +StructID= 0 +Comment= T + +Number= 27 +Mixture= 0.007047 +B= 76.958153 +Alpha= 0.0447488 0.00734525 0.00576457 0.00805666 0.00714188 0.00593389 0.0041663 0.0688592 0.00714299 0.0255115 0.00800708 0.00501678 0.00632646 0.00492002 0.00812967 0.0100074 0.0240134 0.745035 0.00126243 0.00261056 +FullUpdate= 1 +QUpdate= 1 +StructID= 0 +Comment= V + +Number= 28 +Mixture= 0.003957 +B= 150.973328 +Alpha= 0.00517343 0.00213336 0.00350645 0.00390297 0.018439 0.0041919 0.0023655 0.00404231 0.00420998 0.0171406 0.00379068 0.00363696 0.00245861 0.00387467 0.00502035 0.00465674 0.00417283 0.00620977 0.888513 0.012561 +FullUpdate= 1 +QUpdate= 1 +StructID= 0 +Comment= W + +Number= 29 +Mixture= 0.004904 +B= 30.653225 +Alpha= 0.0342049 0.00809912 0.0126852 0.0174701 0.156033 0.0118268 0.0431342 0.0204751 0.0164439 0.0363664 0.0129811 0.0131986 0.0103037 0.0116235 0.0159032 0.0287792 0.0176143 0.024986 0.0131845 0.494687 +FullUpdate= 1 +QUpdate= 1 +StructID= 0 +Comment= Y + +/* $Header$ */ +/* $Header$ */ +/* $Header$ */ diff -r 000000000000 -r 7653ebd919bb test-data/streme_input_neg2.fasta --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/streme_input_neg2.fasta Mon Jul 14 21:33:08 2025 +0000 @@ -0,0 +1,66 @@ +>chr21_19617074_19617124_+ +AAAAATTATTACTAGGGAGGGGGCCGGAAAAACCTCGGGACGTGGGTATATAA 
+>chr21_26934381_26934431_+ +GCGCCTGGTCGGTTATGAGTCACAAGTGAGTTTTCCmATAAAAGGGTCGCACGTT +>chr21_28217753_28217803_- +CAAAGGGGAGGAGTGmGGGTGGGGGTGGGGGTTTCACTGGTCCACTATAAA +>chr21_31710037_31710087_- +AACACCCAGGTTTCTGAGTATATAATCGCCGCACCAAAGAATTTAATTTT +>chr21_31744582_31744632_- +CCCAGGTCTAAGAGCATATATAmACTTGGAGTCCAGACTATGACATTCAAA +>chr21_31768316_31768366_+ +AACGTATATAAATGGTCCTGTCCAGATGTGGCATGCAmAACTCAGAATCTT +>chr21_31914206_31914256_- +TGACACCCACTACTTAGAGTATAAAmATCATTCTGAGAAGTTAGAGACACC +>chr21_31933633_31933683_- +TCAGAGTATATATAAATGTTCCTGTCCAGTCACAAAGTCACCAAACTGACCT +>chr21_31962741_31962791_- +ACATATAACTCAGGTTGGATAAAATAATTTGTATCAGmCAAATCAGGAGAGTCAA +>chr21_31964683_31964733_+ +TCTGATTCACTGAGGCATATAAAAGGCCCTCTGCGGAGAmAGTGTCCATAC +>chr21_31973364_31973414_+ +aaacttaaaactctataaacttaaaactCTAGAATCCTGCTATAC +>chr21_31992870_31992920_+ +CTCATACACTATTGAAGATGTATAAAATTTCATTTGmGATGGTGACATT +>chr21_32185595_32185645_- +TCACCACCCACCAmAGCTGGGATATATAAAGAAGGTTCTGAGACTAGGAA +>chr21_32202076_32202126_- +TGCCCACCAGCTATmGTGAGGTATAAAAAGCCCTGTACGGGAAGAGACCTTCAT +>chr21_32253899_32253949_- +AGCCCCACCCACCAGCAAGGATATATAAAAGCTCAGGAGTCTGGAGTGAC +>chr21_32410820_32410870_- +TCTACCCCACTAATCACTGAGGATGTATAAAAGTCCCAGGGAAGCTGGTG +>chr21_36411748_36411798_- +ATAGTTCTGTATAAmGAGTTTCAGTTGGCATCtaaaaattatataactttattt +>chr21_37838750_37838800_- +gatggttttataaggggcctcaccctcggctcagccctcattcttctcct +>chr21_45705687_45705737_+ +CCGGGGCGGAGCGGCCTTTGCTCTTTGCGTGGTCGCGGGGGTATAACAGC +>chr21_45971413_45971463_- +CAGGCCCTGGGCATATAAAAGCCCCAGCAGmCCAACAGGctcacacacaca +>chr21_45978668_45978718_- +CAGAGGGGTATAAAGGTTCCGACCACTCAGAGGCCTGGCACGAtcactca +>chr21_45993530_45993580_+ +CCAAGGAGGAGTATAAAAGCCCCACAAACCCGAGCACCTCACTCTCGC +>chr21_46020421_46020471_+ +GAGACATATAAAAGCCAACATCCCTGAGCACCTAAACGGactcactc +>chr21_46031920_46031970_+ +GGAAAATACCCAGGGAGGGTATAAATCAGCAGCCAGGGCACACAAAC +>chr21_46046964_46047014_+ +ACAAGGCCAGGAGGGGTATAAAACTGAGAGCCCCAAGAACctcacaca +>chr21_46057197_46057247_+ 
+ATTGCTGAGTCTCCTGCTGGGAAAACACAGGCCCTGGGCATATAAAAGCC +>chr21_46086869_46086919_- +GACGTGTGCTTCTGTGCTGTGGGGATGCCTGGGCCCAGGTATAAAGGC +>chr21_46102103_46102153_- +AGGTGTGCTTCTGTGCTGTGGGGATGCCTGGGTCCAGGTATAAAGGCT +>chr21_47517957_47518007_+ +CCTGGCGGCGGGGCGGGTGGCCGGCGGGGCGGGGTATAAAGGGGGCGG +>chr21_47517957_47518007_+ +CCTGGCGGCGGGGCGGGTCGCCGGCGGGGCGGGGTATAAAGGGGGCGG +>chr21_47517957_47518007_+ +CCTGGCGGCGGGGCGGGTCAGGCCGGCGGCGGGGTATAAAGGGGGCGG +>chr21_47575506_47575556_- +TGAGAAGCCGGTGGGGAGGTGCTGCGTGAGCGTATAAAGGCCCTGGCG +>chr21_47575506_47575556_- +TGAGAAGCCGGTGGGAGmGTGCTGCCGGTGAGCGTATAAAGGCCCTGGCG diff -r 000000000000 -r 7653ebd919bb test-data/streme_input_pos.fasta --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/streme_input_pos.fasta Mon Jul 14 21:33:08 2025 +0000 @@ -0,0 +1,66 @@ +>chr21_19617074_19617124_+ +AAAAATTATTACTAGGGAGGGGGCCGGAACCTCGGGACGTGGGTATATAA +>chr21_26934381_26934431_+ +GCGCCTGGTCGGTTATGAGTCACAAGTGAGTTATAAAAGGGTCGCACGTT +>chr21_28217753_28217803_- +CAAAGGGGAGGAGTGGGGTGGGGGTGGGGGTTTCACTGGTCCTATAAA +>chr21_31710037_31710087_- +AACACCCAGGTTTCTGAGTATATAATCGCCGCACCAAAGAATTTAATTTT +>chr21_31744582_31744632_- +CCCAGGTCTAAGAGCATATATAACTTGGAGTCCAGACTATGACATTCAAA +>chr21_31768316_31768366_+ +AACGTATATAAATGGTCCTGTCCAGATGTG +>chr21_31914206_31914256_- +TGACACCCACTACTTAGAGTATAAAATCATTCTGAGAAGTTAGAGACACC +>chr21_31933633_31933683_- +TCAGAGTATATATAAATGTTCCTGTCCAGTCACAGTCACCAATGACCT +>chr21_31962741_31962791_- +ACATATAACTCAGGTTGGATAAAATAATTTGTACAAATCAGGAGAGTCAA +>chr21_31964683_31964733_+ +TCTGATTCACTGAGGCATATAAAAGGCCCTCTGCGGAGAAGTTAC +>chr21_31973364_31973414_+ +aaacttaaaactctataaacttaaaactCTAGAATCTGATCCTGCTATAC +>chr21_31992870_31992920_+ +CTCATACACTATTGAAGATGTATAAAATTTCATTTGCAGATGGTGACATT +>chr21_32185595_32185645_- +TCACCACCCACCAGAGCTGGGATATATAAAGAAGGTTCTAGGAA +>chr21_32202076_32202126_- +TGCCCACCAGCTTGAGGTATAAAAAGCCCTGTACGGGAAGAGACCTTCAT +>chr21_32253899_32253949_- +AGCCCCACCCACCAGCAAGGATATATAAAAGCTCAGGAGTCTGGAGTGAC +>chr21_32410820_32410870_- 
+TCTACCCCACTAATCACTGAGGATGTATAAAAGTCCCAGGGAAGCTGGTG +>chr21_36411748_36411798_- +ATAGTTCTGTATAGTTTCAGTTGGCATCtaaaaattatataactttattt +>chr21_37838750_37838800_- +gatggttttataaggggcctcaccctcggctcagccctcattcttctcct +>chr21_45705687_45705737_+ +CCGGGGCGGAGCGGCCTTTGCTCTTTGCGTGGTCGGGGTATAACAGC +>chr21_45971413_45971463_- +CAGGCCCTGGGCATATAAAAGCCCCAGCAGCCAACAGGctcacacacaca +>chr21_45978668_45978718_- +CAGAGGGGTATAAAGGTTCCGACCACTCCTGGCACGAtcactca +>chr21_45993530_45993580_+ +CCAAGGAGGAGTATAAAAGCCCCACAAACCCGAGCACCTCACTCACTCGC +>chr21_46020421_46020471_+ +GAGACATATAAAAGCCAACATCCCTGAGCACCTAACACACGGactcactc +>chr21_46031920_46031970_+ +GGAAAATACCCAGGGAGGGTATAAAACCTCAGCAGCCAGGGCACACAAAC +>chr21_46046964_46047014_+ +ACAAGGCCAGGAGGGGTATAAAAGCCTGAGAGCCCCAAGAACctcacaca +>chr21_46057197_46057247_+ +ATTGCTGAGTCTCCTGCTGGGAAAACACAGGCCCTGGGCATATAAAAGCC +>chr21_46086869_46086919_- +GACAGGTGTGCTTCTGTGCTGTGGGGATGCCTGGGCCCAGGTATAAAGGC +>chr21_46102103_46102153_- +AGGTGTGTGCTTCTGTGCTGTGGGGATGCCTGGGTCCAGGTATAAAGGCT +>chr21_47517957_47518007_+ +CCTGGCGGCGGGGCGGGTCAGGCCGGCGGGGCGGGGTATAAAGGGGGCGG +>chr21_47517957_47518007_+ +CCTGGCGGCGGGGCGGGTCAGGCGGGGCGGGGTATAAAGGGGGCGG +>chr21_47517957_47518007_+ +CCTGGCGGCGGGGCGGGTCAGGCCGGCGGGGTATAAAGGGGGCGG +>chr21_47575506_47575556_- +TGAGAAGCCGGTGGGGAGGTGCTGCCGGTGAGCGTATAAAGGCCCTGGCG +>chr21_47575506_47575556_- +TGAGAAGCCGGTGGGGAGGTGCTGCCGGTGAGCGTATAAAGGCCCTGGCG diff -r 000000000000 -r 7653ebd919bb test-data/streme_input_pos2.fasta --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/streme_input_pos2.fasta Mon Jul 14 21:33:08 2025 +0000 @@ -0,0 +1,66 @@ +>chr21_19617074_19617124_+ +AAAAATTATTACTAGGGAGGGGGCmGGAACCTCGGGACGTGGGTmATATAA +>chr21_26934381_26934431_+ +GCGCCTGGTCGGTTATGAGTCACAAGTGAGTTATAAAAGGGTCGCACGTT +>chr21_28217753_28217803_- +CAAAGGGGAGGAGTGGGGTGGGGGTGGGGGTTTCACTGGTmCACTATAAA +>chr21_31710037_31710087_- +AACACCCAGGTTTCTGAGTATATAATCGCCGCACCAAAGAATTTAATTTTTT +>chr21_31744582_31744632_- 
+CCmAGGTCTAAGAGCATATATTAACTTGGAGTCCAGACTATGACATTCAAA +>chr21_31768316_31768366_+ +AACGTATATAAATGGTCCTGTCCAGATGTGGCATGCAAACTmAGAATCTT +>chr21_31914206_31914256_- +TGACACCCACTACTTAGAGTATAAAATCATTCTGAGAAGTTAGAGA +>chr21_31933633_31933683_- +TCAGAGTATATATAAATGTTCCTGTCCAGTCACAGTCACCAAACTGACCT +>chr21_31962741_31962791_- +ACATATAACTCAGGTTGGATAAAATAATTTGTACAAATCAGG +>chr21_31964683_31964733_+ +TCTGATTCACTGAGGCATATAAAAGGCCCTCTGCGGAGAAGTGTCCATAC +>chr21_31973364_31973414_+ +aaacttaaaactctataaacttaaaactCTAGAATCTGATCCTGCTATAC +>chr21_31992870_31992920_+ +CTCATACACTATTGAAGATGTATAAAATTTCATTTGCAGATGGTGACATT +>chr21_32185595_32185645_- +TCACCACCCACCAGAGCTGGGATATATAAAGAAGGTTCTGAGACTAGGAA +>chr21_32202076_32202126_- +TGCCCACCAGCTTGAGGTATAAAAAGCCCTGTACGGGAAGAGACCTTCAT +>chr21_32253899_32253949_- +AGCCCCACCCACCAGCAAGGATATATAAAAGCTCAGGAGTCTGGAGTGAC +>chr21_32410820_32410870_- +TCTACCCCACTAATCACTGAGGATGTATAAAAGTCCCAGGGAAGCTGGTG +>chr21_36411748_36411798_- +ATAGTTCTGTATAGTTTCAGTTGGCATCtaaaaattatataactttattt +>chr21_37838750_37838800_- +gatggttttataaggggcctcaccctcggctcagccctcattcttctcct +>chr21_45705687_45705737_+ +CCGGGGCGGAGCGGCCTTTGCTCTTTGCGTGGTCGCGGGmGGTATAACAGC +>chr21_45971413_45971463_- +CAGGCCCTGGGCATATAAAAGCCCCAGCAGCCAACAGGctcacacacaca +>chr21_45978668_45978718_- +CAGAGGGGTATAAAGGTTCCGACCACTCAGAGGCCTGGCACGAtcactca +>chr21_45993530_45993580_+ +CCAAGGAGGAGTATAAAAGCCCCACAAACCCGAGCACCmTCACTCACTCGC +>chr21_46020421_46020471_+ +GAGACATATAAAAGCCAACATCCCTGAGCACCTAACACACGGactcactc +>chr21_46031920_46031970_+ +GGAAAATACCCAGGGAGGGTATAAAACCTCAGCAGCCAGGGCACACAAAC +>chr21_46046964_46047014_+ +ACAAGGCCAGGAGGGGTATAAAAGCCTGAGAGCCCCAAGAACctcacaca +>chr21_46057197_46057247_+ +ATTGCTGAGTCTCCTGCTGGGAAAACACAGGCCCTGGGCAT +>chr21_46086869_46086919_- +GACAGGTGTGCTTCTGTGCTGTGGGGATGCCTGGGCCCAGGTATAAAGGC +>chr21_46102103_46102153_- +AGGTGTGTGCTTCTGTGCTGTGGGGATGCCTCCAGGTATAAAGGCT +>chr21_47517957_47518007_+ +CCTGGCGGCGGGGCGGGTCAGGCCGGCGGGGCGGGGTATAAAGGGGGmGG +>chr21_47517957_47518007_+ 
+CCTGGCGGCGmGGGCGGGTCAGGCCGGCGGGmGCGGGGTATAAAGGGGGCGG +>chr21_47517957_47518007_+ +CCTGGCGGCGGGmGCGGGTCAGGCCGGCGGGGCGGGGTATAAAGGGGmGCGG +>chr21_47575506_47575556_- +TGAGAAGCCGGTGGGGAGGTGmTGCCGGTGAGCmGTATAAAGGCCCTGGCG +>chr21_47575506_47575556_- +TGAGAAGCmGGTGGGGAGGTGCTGCCGGTGAGCGTATAAAGmGCCCTGGCG diff -r 000000000000 -r 7653ebd919bb test-data/streme_output_test1.html --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/streme_output_test1.html Mon Jul 14 21:33:08 2025 +0000 @@ -0,0 +1,39 @@ + "train_negatives": { + "from": "shuffled", + "count": 33, + "positions": 1597 + }, + "test_positives": { + "count": 0, + "positions": 0 + }, + "test_negatives": { + "count": 0, + "positions": 0 + }, + "sequence_db": { + "freqs": [0.245, 0.255, 0.255, 0.245] + }, + "motifs": [ + { + "db": 0, + "id": "1-CTTTTATAYRCCY", + "alt": "STREME-1", + "width": 13, + "initial_width": 8, + "seed": "CTTTTATATGCCT", + "score_threshold": 10.1927, + "npassing": 18, + "train_pos_count": 18, + "train_neg_count": 0, + "train_log_pvalue": -6.81978, + "train_pvalue": "1.5e-007", + "train_dtc": -1.0, + "train_bernoulli": -1, + "test_pos_count": 0, + "test_neg_count": 0, + "test_log_pvalue": 0, + "test_pvalue": "1.0e+000", + "test_log_evalue": 0.69897, + "test_evalue": "5.0e+000", + "test_dtc": -1.0, \ No newline at end of file diff -r 000000000000 -r 7653ebd919bb test-data/streme_output_test1.txt --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/streme_output_test1.txt Mon Jul 14 21:33:08 2025 +0000 @@ -0,0 +1,93 @@ +******************************************************************************** +STREME - Sensitive, Thorough, Rapid, Enriched Motif Elicitation +******************************************************************************** +MEME version 5.5.8 (Release date: Thu May 15 15:01:46 2025 -0700) + +For further information on how to interpret these results please access https://meme-suite.org/meme. 
+To get a copy of the MEME Suite software please access https://meme-suite.org. + +******************************************************************************** + + +******************************************************************************** +REFERENCE +******************************************************************************** +If you use this program in your research, please cite: + +Timothy L. Bailey, +"STREME: accurate and versatile sequence motif discovery", +Bioinformatics, Mar. 24, 2021. +******************************************************************************** + + +ALPHABET= ACGT + +strands: + - + +Background letter frequencies +A 0.244 C 0.256 G 0.256 T 0.244 + +MOTIF 1-CTTTTATAYRCCY STREME-1 +letter-probability matrix: alength= 4 w= 13 nsites= 18 S= 1.5e-007 + 0.072963 0.851476 0.002598 0.072963 + 0.072963 0.145128 0.002598 0.779311 + 0.002486 0.002598 0.073075 0.921841 + 0.002486 0.002598 0.002598 0.992318 + 0.002486 0.002598 0.002598 0.992318 + 0.992318 0.002598 0.002598 0.002486 + 0.002486 0.002598 0.073075 0.921841 + 0.992318 0.002598 0.002598 0.002486 + 0.002486 0.497514 0.002598 0.497402 + 0.284394 0.143552 0.499090 0.072963 + 0.002486 0.710522 0.002598 0.284394 + 0.002486 0.779422 0.073075 0.145017 + 0.072963 0.428613 0.073075 0.425349 + +MOTIF 2-CCCCACCRSC STREME-2 +letter-probability matrix: alength= 4 w= 10 nsites= 12 S= 7.2e-005 + 0.139001 0.787776 0.070814 0.002409 + 0.070705 0.924368 0.002517 0.002409 + 0.002409 0.924368 0.070814 0.002409 + 0.002409 0.992664 0.002517 0.002409 + 0.716267 0.002517 0.210510 0.070705 + 0.002409 0.856072 0.070814 0.070705 + 0.208825 0.786248 0.002517 0.002409 + 0.343890 0.030359 0.555046 0.070705 + 0.070705 0.376471 0.550414 0.002409 + 0.208825 0.786248 0.002517 0.002409 + +MOTIF 3-RCAGAAKCA STREME-3 +letter-probability matrix: alength= 4 w= 9 nsites= 10 S= 4.4e-004 + 0.595835 0.003626 0.397069 0.003470 + 0.003470 0.694352 0.298708 0.003470 + 0.792557 0.003626 0.101987 0.101831 + 0.003470 
0.101987 0.891074 0.003470 + 0.694196 0.003626 0.298708 0.003470 + 0.694196 0.298708 0.003626 0.003470 + 0.003470 0.101987 0.300909 0.593635 + 0.101831 0.792713 0.003626 0.101831 + 0.989279 0.003626 0.003626 0.003470 + +MOTIF 4-RAGTTATAAA STREME-4 +letter-probability matrix: alength= 4 w= 10 nsites= 8 S= 2.4e-003 + 0.333562 0.113112 0.440386 0.112939 + 0.988110 0.004021 0.004021 0.003848 + 0.003848 0.004021 0.879191 0.112939 + 0.003848 0.004021 0.222204 0.769927 + 0.112939 0.004021 0.004021 0.879018 + 0.769927 0.004021 0.113112 0.112939 + 0.003848 0.004021 0.113112 0.879018 + 0.988110 0.004021 0.004021 0.003848 + 0.549304 0.113112 0.113112 0.224471 + 0.769927 0.004021 0.113112 0.112939 + +MOTIF 5-AACCTCGG STREME-5 +letter-probability matrix: alength= 4 w= 8 nsites= 7 S= 5.5e-003 + 0.973700 0.008894 0.008894 0.008511 + 0.732403 0.250191 0.008894 0.008511 + 0.008511 0.974083 0.008894 0.008511 + 0.008511 0.974083 0.008894 0.008511 + 0.008511 0.008894 0.008894 0.973700 + 0.008511 0.732786 0.250191 0.008511 + 0.249809 0.008894 0.732786 0.008511 + 0.008511 0.008894 0.974083 0.008511 \ No newline at end of file diff -r 000000000000 -r 7653ebd919bb test-data/streme_output_test1.xml --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/streme_output_test1.xml Mon Jul 14 21:33:08 2025 +0000 @@ -0,0 +1,26 @@ + + + + + + + + + + + + + + + + + both + + + + 0.244 + 0.256 + 0.256 + 0.244 + + \ No newline at end of file diff -r 000000000000 -r 7653ebd919bb test-data/streme_output_test2.html --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/streme_output_test2.html Mon Jul 14 21:33:08 2025 +0000 @@ -0,0 +1,43 @@ + "train_negatives": { + "from": "shuffled", + "count": 33, + "positions": 1597 + }, + "test_positives": { + "count": 0, + "positions": 0 + }, + "test_negatives": { + "count": 0, + "positions": 0 + }, + "sequence_db": { + "freqs": [ + 0.218, 0.24, 0.24, 0.218, 0.0266, 0.0125, 0, 0.00313, 0, 0, + 0.0266, 0, 0, 0, 0.0125, 0.00313 + ] + }, + "motifs": [ + { + 
"db": 0, + "id": "1-GTATAAAAGC", + "alt": "STREME-1", + "width": 10, + "initial_width": 5, + "seed": "GTATAAAGGC", + "score_threshold": 9.73039, + "npassing": 28, + "train_pos_count": 28, + "train_neg_count": 0, + "train_log_pvalue": -13.1578, + "train_pvalue": "7.0e-014", + "train_dtc": -1.0, + "train_bernoulli": -1, + "test_pos_count": 0, + "test_neg_count": 0, + "test_log_pvalue": 0, + "test_pvalue": "1.0e+000", + "test_log_evalue": 0.477121, + "test_evalue": "3.0e+000", + "test_dtc": -1.0, + "test_bernoulli": -1, \ No newline at end of file diff -r 000000000000 -r 7653ebd919bb test-data/streme_output_test2.txt --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/streme_output_test2.txt Mon Jul 14 21:33:08 2025 +0000 @@ -0,0 +1,78 @@ +******************************************************************************** +STREME - Sensitive, Thorough, Rapid, Enriched Motif Elicitation +******************************************************************************** +MEME version 5.5.8 (Release date: Thu May 15 15:01:46 2025 -0700) + +For further information on how to interpret these results please access https://meme-suite.org/meme. +To get a copy of the MEME Suite software please access https://meme-suite.org. + +******************************************************************************** + + +******************************************************************************** +REFERENCE +******************************************************************************** +If you use this program in your research, please cite: + +Timothy L. Bailey, +"STREME: accurate and versatile sequence motif discovery", +Bioinformatics, Mar. 24, 2021. 
+******************************************************************************** + + +******************************************************************************** +ALPHABET "DNA with covalent modifications" DNA-LIKE +******************************************************************************** +A "Adenine" 8510A8 ~ T "Thymine" A89610 +C "Cytosine" A50026 ~ G "Guanine" 313695 +a "N6-methyladenine" 8510A8 ~ t "Thymine_lowercase" 756BB1 +c "5-Carboxylcytosine" FEE090 ~ 4 "Guanine:5-Carboxylcytosine" E0F3F8 +f "5-Formylcytosine" FDAE61 ~ 3 "Guanine:5-Formylcytosine" ABD9E9 +g "modified_g" 00897B ~ 5 "cytosine_lowercase" 53698A +h "5-Hydroxymethylcytosine" F46D43 ~ 2 "Guanine:5-Hydroxymethylcytosine" 74ADD1 +m "5-Methylcytosine" D73027 ~ 1 "Guanine:5-Methylcytosine" 4575B4 +? = ACGTacfghmt12345 +******************************************************************************** + +strands: + - + +Background letter frequencies +A 0.218 C 0.24 G 0.24 T 0.218 a 0.0266 c 0.0125 f 1.96e-05 g 0.00315 h 1.96e-05 m 1.96e-05 t 0.0266 1 1.96e-05 2 1.96e-05 3 1.96e-05 4 0.0125 5 0.00315 + +MOTIF 1-GTATAAAAGC STREME-1 +letter-probability matrix: alength= 16 w= 10 nsites= 28 S= 7.0e-014 + 0.344606 0.001172 0.618858 0.034950 0.000130 0.000061 0.000000 0.000015 0.000000 0.000000 0.000130 0.000000 0.000000 0.000000 0.000061 0.000015 + 0.001065 0.001172 0.001172 0.996177 0.000130 0.000061 0.000000 0.000015 0.000000 0.000000 0.000130 0.000000 0.000000 0.000000 0.000061 0.000015 + 0.996177 0.001172 0.001172 0.001065 0.000130 0.000061 0.000000 0.000015 0.000000 0.000000 0.000130 0.000000 0.000000 0.000000 0.000061 0.000015 + 0.001065 0.001172 0.001172 0.996177 0.000130 0.000061 0.000000 0.000015 0.000000 0.000000 0.000130 0.000000 0.000000 0.000000 0.000061 0.000015 + 0.996177 0.001172 0.001172 0.001065 0.000130 0.000061 0.000000 0.000015 0.000000 0.000000 0.000130 0.000000 0.000000 0.000000 0.000061 0.000015 + 0.928407 0.001172 0.035057 0.034950 0.000130 0.000061 0.000000 0.000015 
0.000000 0.000000 0.000130 0.000000 0.000000 0.000000 0.000061 0.000015 + 0.860638 0.136711 0.001172 0.001065 0.000130 0.000061 0.000000 0.000015 0.000000 0.000000 0.000130 0.000000 0.000000 0.000000 0.000061 0.000015 + 0.548672 0.001172 0.313139 0.136603 0.000130 0.000061 0.000000 0.000015 0.000000 0.000000 0.000130 0.000000 0.000000 0.000000 0.000061 0.000015 + 0.068834 0.068941 0.725207 0.136603 0.000130 0.000061 0.000000 0.000015 0.000000 0.000000 0.000130 0.000000 0.000000 0.000000 0.000061 0.000015 + 0.068834 0.485705 0.308443 0.136603 0.000130 0.000061 0.000000 0.000015 0.000000 0.000000 0.000130 0.000000 0.000000 0.000000 0.000061 0.000015 + +MOTIF 2-CCCACCAGA STREME-2 +letter-probability matrix: alength= 16 w= 9 nsites= 20 S= 2.2e-007 + 0.001482 0.947685 0.048775 0.001482 0.000181 0.000085 0.000000 0.000021 0.000000 0.000000 0.000181 0.000000 0.000000 0.000000 0.000085 0.000021 + 0.143970 0.805197 0.048775 0.001482 0.000181 0.000085 0.000000 0.000021 0.000000 0.000000 0.000181 0.000000 0.000000 0.000000 0.000085 0.000021 + 0.095771 0.711962 0.143064 0.048626 0.000181 0.000085 0.000000 0.000021 0.000000 0.000000 0.000181 0.000000 0.000000 0.000000 0.000085 0.000021 + 0.947536 0.001631 0.048775 0.001482 0.000181 0.000085 0.000000 0.000021 0.000000 0.000000 0.000181 0.000000 0.000000 0.000000 0.000085 0.000021 + 0.095771 0.710908 0.191263 0.001482 0.000181 0.000085 0.000000 0.000021 0.000000 0.000000 0.000181 0.000000 0.000000 0.000000 0.000085 0.000021 + 0.001482 0.900540 0.001631 0.095771 0.000181 0.000085 0.000000 0.000021 0.000000 0.000000 0.000181 0.000000 0.000000 0.000000 0.000085 0.000021 + 0.663614 0.095920 0.096974 0.142915 0.000181 0.000085 0.000000 0.000021 0.000000 0.000000 0.000181 0.000000 0.000000 0.000000 0.000085 0.000021 + 0.095771 0.332697 0.569474 0.001482 0.000181 0.000085 0.000000 0.000021 0.000000 0.000000 0.000181 0.000000 0.000000 0.000000 0.000085 0.000021 + 0.473982 0.239462 0.143064 0.142915 0.000181 0.000085 0.000000 0.000021 
0.000000 0.000000 0.000181 0.000000 0.000000 0.000000 0.000085 0.000021 + +MOTIF 3-4a4t4a4a4T STREME-3 +letter-probability matrix: alength= 16 w= 10 nsites= 7 S= 5.5e-003 + 0.004400 0.004842 0.004842 0.004400 0.140510 0.000253 0.000000 0.000064 0.000000 0.000000 0.000537 0.000000 0.000000 0.000000 0.840087 0.000064 + 0.004400 0.004842 0.004842 0.004400 0.700399 0.000253 0.000000 0.000064 0.000000 0.000000 0.280482 0.000000 0.000000 0.000000 0.000253 0.000064 + 0.004400 0.004842 0.004842 0.004400 0.000537 0.000253 0.000000 0.000064 0.000000 0.000000 0.000537 0.000000 0.000000 0.000000 0.980059 0.000064 + 0.004400 0.004842 0.004842 0.004400 0.000537 0.000253 0.000000 0.000064 0.000000 0.000000 0.840371 0.000000 0.000000 0.000000 0.140226 0.000064 + 0.004400 0.004842 0.004842 0.004400 0.000537 0.000253 0.000000 0.000064 0.000000 0.000000 0.280482 0.000000 0.000000 0.000000 0.700115 0.000064 + 0.004400 0.004842 0.004842 0.004400 0.560427 0.000253 0.000000 0.000064 0.000000 0.000000 0.420454 0.000000 0.000000 0.000000 0.000253 0.000064 + 0.004400 0.004842 0.004842 0.144372 0.000537 0.000253 0.000000 0.000064 0.000000 0.000000 0.280482 0.000000 0.000000 0.000000 0.560142 0.000064 + 0.004400 0.144814 0.144814 0.004400 0.420454 0.000253 0.000000 0.000064 0.000000 0.000000 0.280482 0.000000 0.000000 0.000000 0.000253 0.000064 + 0.004400 0.144814 0.144814 0.144372 0.140510 0.000253 0.000000 0.000064 0.000000 0.000000 0.140510 0.000000 0.000000 0.000000 0.280198 0.000064 + 0.004400 0.144814 0.004842 0.284344 0.280482 0.000253 0.000000 0.000064 0.000000 0.000000 0.000537 0.000000 0.000000 0.000000 0.280198 0.000064 \ No newline at end of file diff -r 000000000000 -r 7653ebd919bb test-data/streme_output_test2.xml --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/streme_output_test2.xml Mon Jul 14 21:33:08 2025 +0000 @@ -0,0 +1,39 @@ + + + + + + + + + + + + + + + + + + + + both + + + + 0.218 + 0.24 + 0.24 + 0.218 + 0.0266 + 0.0125 + 1.96e-05 + 0.00315 + 1.96e-05 + 
1.96e-05 + 0.0266 + 1.96e-05 + 1.96e-05 + 1.96e-05 + 0.0125 + 0.00315 \ No newline at end of file diff -r 000000000000 -r 7653ebd919bb test-data/streme_output_test3.html --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/streme_output_test3.html Mon Jul 14 21:33:08 2025 +0000 @@ -0,0 +1,38 @@ + "max_sites": 2, + "site_hist": [0, 6, 1], + "len": 5, + "nsites": 7, + "evalue": "0", + "pwm": [ + [ + 0.00775938, 0.00626088, 8.41549e-07, 8.41549e-07, 8.41549e-07, + 0.979973, 8.41549e-07, 8.41549e-07, 8.41549e-07, 8.41549e-07, + 0.000219631, 8.41549e-07, 8.41549e-07, 8.41549e-07, + 8.41549e-07, 8.41549e-07, 0.00577435, 8.41549e-07, + 8.41549e-07, 8.41549e-07 + ], [ + 0.00775938, 0.588717, 8.41549e-07, 8.41549e-07, 8.41549e-07, + 0.397517, 8.41549e-07, 8.41549e-07, 8.41549e-07, 8.41549e-07, + 0.000219631, 8.41549e-07, 8.41549e-07, 8.41549e-07, + 8.41549e-07, 8.41549e-07, 0.00577435, 8.41549e-07, + 8.41549e-07, 8.41549e-07 + ], [ + 0.00775938, 0.00626088, 8.41549e-07, 8.41549e-07, 8.41549e-07, + 0.00777606, 8.41549e-07, 8.41549e-07, 8.41549e-07, + 8.41549e-07, 0.972417, 8.41549e-07, 8.41549e-07, 8.41549e-07, + 8.41549e-07, 8.41549e-07, 0.00577435, 8.41549e-07, + 8.41549e-07, 8.41549e-07 + ], [ + 0.00775938, 0.00626088, 8.41549e-07, 8.41549e-07, 8.41549e-07, + 0.979973, 8.41549e-07, 8.41549e-07, 8.41549e-07, 8.41549e-07, + 0.000219631, 8.41549e-07, 8.41549e-07, 8.41549e-07, + 8.41549e-07, 8.41549e-07, 0.00577435, 8.41549e-07, + 8.41549e-07, 8.41549e-07 + ], [ + 0.00775938, 0.00626088, 8.41549e-07, 8.41549e-07, 8.41549e-07, + 0.787258, 8.41549e-07, 8.41549e-07, 8.41549e-07, 8.41549e-07, + 0.000219631, 8.41549e-07, 8.41549e-07, 8.41549e-07, + 8.41549e-07, 8.41549e-07, 0.19849, 8.41549e-07, 8.41549e-07, + 8.41549e-07 + ] + ] \ No newline at end of file diff -r 000000000000 -r 7653ebd919bb test-data/streme_output_test3.txt --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/streme_output_test3.txt Mon Jul 14 21:33:08 2025 +0000 @@ -0,0 +1,79 @@ 
+******************************************************************************** +STREME - Sensitive, Thorough, Rapid, Enriched Motif Elicitation +******************************************************************************** +MEME version 5.5.8 (Release date: Thu May 15 15:01:46 2025 -0700) + +For further information on how to interpret these results please access https://meme-suite.org/meme. +To get a copy of the MEME Suite software please access https://meme-suite.org. + +******************************************************************************** + + +******************************************************************************** +REFERENCE +******************************************************************************** +If you use this program in your research, please cite: + +Timothy L. Bailey, +"STREME: accurate and versatile sequence motif discovery", +Bioinformatics, Mar. 24, 2021. +******************************************************************************** + + +ALPHABET= ACDEFGHIKLMNPQRSTVWY + +strands: + + +Background letter frequencies +A 0.279 C 0.225 D 3.03e-05 E 3.03e-05 F 3.03e-05 G 0.28 H 3.03e-05 I 3.03e-05 K 3.03e-05 L 3.03e-05 M 0.0079 N 3.03e-05 P 3.03e-05 Q 3.03e-05 R 3.03e-05 S 3.03e-05 T 0.208 V 3.03e-05 W 3.03e-05 Y 3.03e-05 + +MOTIF 1-GCMGG STREME-1 +letter-probability matrix: alength= 20 w= 5 nsites= 7 S= 5.5e-003 + 0.007759 0.006261 0.000001 0.000001 0.000001 0.979973 0.000001 0.000001 0.000001 0.000001 0.000220 0.000001 0.000001 0.000001 0.000001 0.000001 0.005774 0.000001 0.000001 0.000001 + 0.007759 0.588717 0.000001 0.000001 0.000001 0.397517 0.000001 0.000001 0.000001 0.000001 0.000220 0.000001 0.000001 0.000001 0.000001 0.000001 0.005774 0.000001 0.000001 0.000001 + 0.007759 0.006261 0.000001 0.000001 0.000001 0.007776 0.000001 0.000001 0.000001 0.000001 0.972417 0.000001 0.000001 0.000001 0.000001 0.000001 0.005774 0.000001 0.000001 0.000001 + 0.007759 0.006261 0.000001 0.000001 0.000001 0.979973 0.000001 0.000001 
0.000001 0.000001 0.000220 0.000001 0.000001 0.000001 0.000001 0.000001 0.005774 0.000001 0.000001 0.000001 + 0.007759 0.006261 0.000001 0.000001 0.000001 0.787258 0.000001 0.000001 0.000001 0.000001 0.000220 0.000001 0.000001 0.000001 0.000001 0.000001 0.198490 0.000001 0.000001 0.000001 + +MOTIF 2-GGTMA STREME-2 +letter-probability matrix: alength= 20 w= 5 nsites= 6 S= 5.2e-002 + 0.166242 0.005192 0.000001 0.000001 0.000001 0.823585 0.000001 0.000001 0.000001 0.000001 0.000182 0.000001 0.000001 0.000001 0.000001 0.000001 0.004788 0.000001 0.000001 0.000001 + 0.006434 0.164999 0.000001 0.000001 0.000001 0.823585 0.000001 0.000001 0.000001 0.000001 0.000182 0.000001 0.000001 0.000001 0.000001 0.000001 0.004788 0.000001 0.000001 0.000001 + 0.006434 0.005192 0.000001 0.000001 0.000001 0.006448 0.000001 0.000001 0.000001 0.000001 0.000182 0.000001 0.000001 0.000001 0.000001 0.000001 0.981733 0.000001 0.000001 0.000001 + 0.006434 0.277760 0.000001 0.000001 0.000001 0.166256 0.000001 0.000001 0.000001 0.000001 0.479605 0.000001 0.000001 0.000001 0.000001 0.000001 0.069935 0.000001 0.000001 0.000001 + 0.823572 0.164999 0.000001 0.000001 0.000001 0.006448 0.000001 0.000001 0.000001 0.000001 0.000182 0.000001 0.000001 0.000001 0.000001 0.000001 0.004788 0.000001 0.000001 0.000001 + +MOTIF 3-GTATAAAATCA STREME-3 +letter-probability matrix: alength= 20 w= 11 nsites= 8 S= 9.3e-002 + 0.008845 0.007137 0.000001 0.000001 0.000001 0.977170 0.000001 0.000001 0.000001 0.000001 0.000250 0.000001 0.000001 0.000001 0.000001 0.000001 0.006583 0.000001 0.000001 0.000001 + 0.008845 0.007137 0.000001 0.000001 0.000001 0.008864 0.000001 0.000001 0.000001 0.000001 0.000250 0.000001 0.000001 0.000001 0.000001 0.000001 0.974888 0.000001 0.000001 0.000001 + 0.977151 0.007137 0.000001 0.000001 0.000001 0.008864 0.000001 0.000001 0.000001 0.000001 0.000250 0.000001 0.000001 0.000001 0.000001 0.000001 0.006583 0.000001 0.000001 0.000001 + 0.008845 0.007137 0.000001 0.000001 0.000001 0.008864 
0.000001 0.000001 0.000001 0.000001 0.000250 0.000001 0.000001 0.000001 0.000001 0.000001 0.974888 0.000001 0.000001 0.000001 + 0.977151 0.007137 0.000001 0.000001 0.000001 0.008864 0.000001 0.000001 0.000001 0.000001 0.000250 0.000001 0.000001 0.000001 0.000001 0.000001 0.006583 0.000001 0.000001 0.000001 + 0.757464 0.007137 0.000001 0.000001 0.000001 0.228552 0.000001 0.000001 0.000001 0.000001 0.000250 0.000001 0.000001 0.000001 0.000001 0.000001 0.006583 0.000001 0.000001 0.000001 + 0.757464 0.007137 0.000001 0.000001 0.000001 0.008864 0.000001 0.000001 0.000001 0.000001 0.000250 0.000001 0.000001 0.000001 0.000001 0.000001 0.226270 0.000001 0.000001 0.000001 + 0.757464 0.007137 0.000001 0.000001 0.000001 0.008864 0.000001 0.000001 0.000001 0.000001 0.000250 0.000001 0.000001 0.000001 0.000001 0.000001 0.226270 0.000001 0.000001 0.000001 + 0.008845 0.226824 0.000001 0.000001 0.000001 0.228552 0.000001 0.000001 0.000001 0.000001 0.000250 0.000001 0.000001 0.000001 0.000001 0.000001 0.535514 0.000001 0.000001 0.000001 + 0.008845 0.885886 0.000001 0.000001 0.000001 0.008864 0.000001 0.000001 0.000001 0.000001 0.000250 0.000001 0.000001 0.000001 0.000001 0.000001 0.096140 0.000001 0.000001 0.000001 + 0.448220 0.226824 0.000001 0.000001 0.000001 0.008864 0.000001 0.000001 0.000001 0.000001 0.000250 0.000001 0.000001 0.000001 0.000001 0.000001 0.315827 0.000001 0.000001 0.000001 + +MOTIF 4-GAGGTG STREME-4 +letter-probability matrix: alength= 20 w= 6 nsites= 5 S= 9.8e-002 + 0.007829 0.200766 0.000001 0.000001 0.000001 0.785344 0.000001 0.000001 0.000001 0.000001 0.000222 0.000001 0.000001 0.000001 0.000001 0.000001 0.005826 0.000001 0.000001 0.000001 + 0.979776 0.006317 0.000001 0.000001 0.000001 0.007846 0.000001 0.000001 0.000001 0.000001 0.000222 0.000001 0.000001 0.000001 0.000001 0.000001 0.005826 0.000001 0.000001 0.000001 + 0.202278 0.041933 0.000001 0.000001 0.000001 0.670460 0.000001 0.000001 0.000001 0.000001 0.000222 0.000001 0.000001 0.000001 0.000001 
0.000001 0.085095 0.000001 0.000001 0.000001 + 0.007829 0.200766 0.000001 0.000001 0.000001 0.785344 0.000001 0.000001 0.000001 0.000001 0.000222 0.000001 0.000001 0.000001 0.000001 0.000001 0.005826 0.000001 0.000001 0.000001 + 0.007829 0.006317 0.000001 0.000001 0.000001 0.007846 0.000001 0.000001 0.000001 0.000001 0.000222 0.000001 0.000001 0.000001 0.000001 0.000001 0.977773 0.000001 0.000001 0.000001 + 0.087098 0.006317 0.000001 0.000001 0.000001 0.900525 0.000001 0.000001 0.000001 0.000001 0.000222 0.000001 0.000001 0.000001 0.000001 0.000001 0.005826 0.000001 0.000001 0.000001 + +MOTIF 5-TCACACACA STREME-5 +letter-probability matrix: alength= 20 w= 9 nsites= 5 S= 9.8e-002 + 0.007502 0.192368 0.000001 0.000001 0.000001 0.007518 0.000001 0.000001 0.000001 0.000001 0.000212 0.000001 0.000001 0.000001 0.000001 0.000001 0.792388 0.000001 0.000001 0.000001 + 0.193817 0.716905 0.000001 0.000001 0.000001 0.083471 0.000001 0.000001 0.000001 0.000001 0.000212 0.000001 0.000001 0.000001 0.000001 0.000001 0.005583 0.000001 0.000001 0.000001 + 0.794307 0.006053 0.000001 0.000001 0.000001 0.007518 0.000001 0.000001 0.000001 0.000001 0.000212 0.000001 0.000001 0.000001 0.000001 0.000001 0.191898 0.000001 0.000001 0.000001 + 0.007502 0.903220 0.000001 0.000001 0.000001 0.007518 0.000001 0.000001 0.000001 0.000001 0.000212 0.000001 0.000001 0.000001 0.000001 0.000001 0.081536 0.000001 0.000001 0.000001 + 0.794307 0.006053 0.000001 0.000001 0.000001 0.007518 0.000001 0.000001 0.000001 0.000001 0.000212 0.000001 0.000001 0.000001 0.000001 0.000001 0.191898 0.000001 0.000001 0.000001 + 0.007502 0.792858 0.000001 0.000001 0.000001 0.193833 0.000001 0.000001 0.000001 0.000001 0.000212 0.000001 0.000001 0.000001 0.000001 0.000001 0.005583 0.000001 0.000001 0.000001 + 0.718354 0.082006 0.000001 0.000001 0.000001 0.007518 0.000001 0.000001 0.000001 0.000001 0.000212 0.000001 0.000001 0.000001 0.000001 0.000001 0.191898 0.000001 0.000001 0.000001 + 0.007502 0.979173 0.000001 0.000001 
0.000001 0.007518 0.000001 0.000001 0.000001 0.000001 0.000212 0.000001 0.000001 0.000001 0.000001 0.000001 0.005583 0.000001 0.000001 0.000001 + 0.532038 0.006053 0.000001 0.000001 0.000001 0.193833 0.000001 0.000001 0.000001 0.000001 0.000212 0.000001 0.000001 0.000001 0.000001 0.000001 0.267851 0.000001 0.000001 0.000001 diff -r 000000000000 -r 7653ebd919bb test-data/streme_output_test3.xml --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/test-data/streme_output_test3.xml Mon Jul 14 21:33:08 2025 +0000 @@ -0,0 +1,73 @@ + + + + + + + + + + + + + + + + + + + + + + + + + + none + + + + 0.279 + 0.225 + 3.03e-05 + 3.03e-05 + 3.03e-05 + 0.28 + 3.03e-05 + 3.03e-05 + 3.03e-05 + 3.03e-05 + 0.0079 + 3.03e-05 + 3.03e-05 + 3.03e-05 + 3.03e-05 + 3.03e-05 + 0.208 + 3.03e-05 + 3.03e-05 + 3.03e-05 + + + + Differential Enrichment + Fisher Exact Test + 5 + 20 + 1 + 0.1 + 25 + 4 + 20 + 3 + 0 + no + no + 0 + 5 + 1 + 0.85 + 5 + no + no + 0 \ No newline at end of file diff -r 000000000000 -r 7653ebd919bb tool_data_table_conf.xml.sample --- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/tool_data_table_conf.xml.sample Mon Jul 14 21:33:08 2025 +0000 @@ -0,0 +1,7 @@ + + + + value, dbkey, name, path + +
+