Figure S2: Top motif from PosMotif2 on samples of type real from the Tompa data set in Tompa's format >data set dm01r >instances seq_0,-197,CGCCGGCTGAGCAGCCT seq_1,-986,CGCCGCATGTGAGGGGT seq_2,-1104,CGCCGACTGCGCTGGAT seq_3,-112,CGCCGGATAAGCTGGAT >data set dm02r >instances seq_0,-1341,CCATCGCCATC seq_0,-1273,CCAATCCCGATCCCTAGCCCGATCCCAATCCCAATCCCAATCCC seq_0,-968,CACTATCCCGGTCC seq_0,-496,CCGTCCCGCTC seq_0,-329,CCATCCCGCTGC seq_0,-207,CTGTCCCGCTC >data set dm03r >instances seq_0,-599,GAATTCCCGTCGATC seq_0,-218,GAATGGCCGTCGAGC seq_2,-1540,GAACACCCGCGGATC seq_2,-533,GAAACCCCGAGGAGC >data set dm04r >instances seq_0,-91,GAACTCTCTCTCTTGCTC seq_1,-776,GCTCTCCCCCTC seq_1,-320,GATCTCGCCCTCTCGCTC seq_1,-293,GACCTCTCTTTC seq_2,-414,GAACTCTCTCTCTCTC seq_3,-483,GATCGCTCTCTCACTC >data set dm05r >instances seq_2,-2383,CCCCACCCCCCCACCA seq_2,-2011,CCCCAACCCCCCACCA >data set dm06r >instances seq_0,-2829,ATATTTTCAGATAT seq_0,-1955,ATATTTCCAAATAT seq_0,-961,TATCTCCATATAT seq_0,-838,ATATCTCCTAATAT seq_0,-258,ATATATACATATAT >data set hm01r >instances seq_5,-1870,CTGTAATCCCAGCTACTCGGGA seq_7,-1910,CTGTAGTCCCAGCTATTCAGGA seq_8,-1993,CTGTAATCCCAGCACTTTGGGA seq_8,-1842,CTGTAGTCCCAGCTACTCGGGA seq_10,-1371,CTGTAATCCCAGCACTTTGGGA seq_10,-1235,CTGTAATCCCAGCTATTCAGGA seq_13,-1464,CTGTAATCCCAGCACTTTGGGA seq_15,-1532,CTGTAATCCTAGCACTTTGAGA seq_16,-1926,CTGTAACCCCAGCTACTGAGGA seq_16,-1756,CTGTAATCCCAACACTTTGGG seq_16,-1623,CTGTAATCCCAGCTACTCAGGA >data set hm02r >instances seq_4,-896,CCTCCCAAAGTGCTGGGATTACAGG seq_5,-850,CCTCCCAAAGTGCTGGGATTACAGG >data set hm03r >instances seq_0,-575,CCCAGCTTAGTGCCTGACACACAGAGGGG seq_1,-556,CCCAGCTTAGTGCCTGACACAGGGAGGTG seq_2,-595,CCCAGCTTAGTGCCTGACACAGGGAGATG >data set hm04r >instances seq_0,-1502,TGCCCAGGCTAGAGTGCAGTGG seq_1,-1215,CCGGCCGGGAGTGCAGAG seq_2,-841,TGCCTAGGCTGGAGTGCAGCGGC seq_5,-191,CGCGGCCCGTGTGCAGAG seq_9,-1189,TCGCCAGGCTGGAGTGCAGTGGC seq_10,-1125,TGCCCAGGCTGGAGTGCAGTGGC >data set hm05r >instances seq_1,-463,CCGGGCGACCGCGGTG seq_1,-210,CAGGGCGACCGCGGAG >data set hm06r >instances seq_0,-269,CCGCCTCGGGCTCCACCC seq_0,-191,CCGCCGCGTAGCCACACC seq_1,-136,CCGCCCCGCCCCTGCGCC seq_1,-21,CGGCCGCGGCCAGAAAC seq_2,-264,CCGCCGCGTTGAGAACC seq_2,-232,CGGCCACGTGACCAGTCC seq_3,-38,CAGCCGCGCGCCCCTTCC seq_4,-379,CTGCCGCGGGCCGGGGCC seq_5,-444,CGGCCTCGCCTGTGACCC seq_5,-229,CCGCCCCGGCGCGCCTC seq_5,-162,CCGCCCCGCGCCGCCCGCCCCGTCCGCGCACC seq_7,-336,GCCACGACGGTCCCCC seq_7,-206,CAGCCTCGAGTGTACACC seq_8,-496,GCCCCGCGTCCGGACC seq_8,-110,CCGCCCCGTCCCGACCCC seq_8,-34,CGGCCCCGCCCTCTCCTC >data set hm07r >instances seq_1,-465,CTGAGAAGCAAA seq_2,-610,CTGAGAAGACAA seq_3,-923,CTGAGAAGTGAA seq_4,-81,CTCAGAAGGGAA >data set hm08r >instances seq_0,-55,ACGTC seq_1,-29,ATGACGTGT seq_2,-66,CGTGACGTTT seq_3,-240,ATGACGTCA seq_4,-182,ATGACGTC seq_5,-426,TGACG seq_5,-183,CGTGACGTCA seq_6,-257,TTACGT seq_6,-219,TGACCTTGTCGT seq_6,-175,TGACCT seq_6,-142,TGACGTCA seq_6,-124,TGACGTCA seq_7,-198,TGACGAC seq_8,-476,TGACAT seq_8,-346,TGACTT seq_8,-97,TGACAT seq_9,-305,ACGTC seq_9,-102,CATGACGTCT seq_10,-113,TGACAT seq_11,-81,GTGACGTCT seq_12,-233,GTGACGT seq_12,-82,TGACGGC seq_12,-32,CGTGACGT seq_13,-254,TGACAT seq_13,-245,TGACTT seq_13,-86,TGTCGT seq_14,-253,TGGCGT >data set hm09r >instances seq_0,-1121,CGGGCTCCCGTAAGCAC seq_0,-227,GGGCCCACGAGACCTCT seq_0,-105,GCCCGCGCGCCACCCCT seq_1,-232,GAGCGCCCGAGTGCTCT seq_1,-194,CGCCCTGCCGAAGACCC seq_2,-304,CGCACTCCCGTTTCCCCT seq_3,-702,CGTTCGCCCGCTGGCCCT seq_4,-1170,CGCACACCTGTAGTCCC seq_4,-1058,CGAGATTCCGTCTCCCC seq_5,-604,CGTCCGCCAGCACACCCGGGCCCGCT seq_6,-486,GCCCCCACGCTCCCTCT seq_6,-196,CGCCCGCCCGCCCGCCCT seq_6,-83,CGCCTTCCCGCCCGCCC seq_7,-440,GCACACACGTGTGCGCT seq_7,-303,CGCGCTCCCGGCGCCCCT seq_8,-373,GAGCTCCCGCCACCAC >data set hm10r >instances seq_0,-357,CAGGCTGGGCC seq_1,-48,CGGGCTTTGGC seq_2,-350,CCGGCTGAGTC seq_3,-389,CAGGCTGGGAC seq_4,-195,CCGGCTGGGCC seq_5,-123,CGGGCTGCGGC >data set hm11r >instances seq_0,-510,CAAAGTAGCCAAT seq_3,-741,CTGAACAGCTAAT seq_4,-80,CCTATCAGCTGAT seq_5,-481,CACACCAGCTAAT seq_6,-426,CTCAACAGCCCAT seq_7,-583,CCTATTAGCACAT >data set hm12r >instances seq_0,-150,GATCAAATTGACGTCATGGTAAAAATTGACGTCATGGTAA >data set hm13r >instances seq_0,-734,TTAACTGAAGATCCCA seq_0,-333,AACTAAATTGCAAA seq_1,-560,TTAACTCAAAAACGGA seq_2,-549,TAACTAACCTGCACA seq_3,-745,TCAACTGAACAGCTAA seq_4,-222,TTAACTGAGGGCCTGA seq_5,-167,TTAACTTAGATTCCCA >data set hm14r >instances seq_1,-365,CACCATGAGCTTTCCATG seq_1,-160,CACCATGAGTCTTCCATG >data set hm15r >instances seq_1,-1915,CACACCTGTAGTCCCAGCTATTCAG seq_2,-1168,CACACCTGTAGTCCCAGCTACTCGG >data set hm16r >instances seq_0,-2252,CCAGGCTGCAGTGCAGTGGTGCGAT seq_1,-1886,CCAGGCTGGAGTGCAGTGCCTCTAT seq_4,-2547,CCAGGCTGGAGTGCAGTGGCGCGAT seq_4,-1910,CCAGGCTGGAGTGCAGTGGCGCGAT seq_5,-2732,CCAGGCTGGAGTGCAGTGGCACGAT seq_6,-2451,CCAGGCTGGAGTGCCGTGGCGCGAT >data set hm17r >instances seq_0,-101,ACTCGGGATCGATCTGGAACTC seq_1,-101,ACTCGGGATCGATCTGGAGCTC seq_2,-103,ACTCCGGATCGATCTGGAGCT >data set hm18r >instances seq_0,-330,GCCACCGCACTCCAGCCTGGG seq_1,-2707,GCCACTGCACTCCAGCCTGGG seq_3,-1878,GCCACTGCACTCCAGCCTGGG >data set hm19r >instances seq_0,-406,CTACCACCACCCCCAA seq_2,-365,CTACCACCACCCACAA >data set hm20r >instances seq_2,-1432,TGTAATCCCAGC seq_3,-1634,GCTGGGTTTACA seq_3,-1498,GCTGGGATTACAG seq_4,-591,CTAGGATTACA seq_4,-457,GCTGGGATTACAG seq_5,-1563,GGTGGGATTACAG seq_5,-1425,CTAGGATTACA seq_5,-1105,TGTAGTACCAGC seq_5,-1031,GCTGTGATTACA seq_5,-328,GCTGGCATTACA seq_6,-1685,CTGGGATTACAG seq_6,-750,TGTAATCCCAGC seq_7,-1317,TGGAATCCCAG seq_12,-1675,TGTAATCCCAGC seq_14,-798,TGTAATCCCAGC seq_15,-1909,TGTAGTCCCAGC seq_15,-384,GCTGGGATTACA seq_18,-1566,TGTAATCCCAGC seq_19,-1614,GTTGGGATTACAG seq_19,-1019,CTGGGAATACA seq_19,-885,GCTGGGATTACAG seq_21,-1409,TGTAATCCCAGC seq_22,-1992,TGTAATCCCAGC seq_22,-1841,TGTAGTCCCAGC seq_22,-974,GCTGAGATTACA seq_22,-839,GCTGGGATTACAG seq_23,-1934,TGTAATCCCAGC seq_24,-1516,GCTGGGATTACAG seq_24,-1310,CTTGGATTACA seq_24,-372,GCTGAGATTACA seq_25,-1867,GCTGGGATTACAG seq_25,-1731,GCTGAGATTACA seq_29,-1370,TGTAATCCCAGC seq_29,-1234,TGTAATCCCAGC seq_29,-623,GCTGGGATTACA seq_31,-1989,GCTGGGATTACAG seq_31,-1842,GCTGGGATTACAG seq_32,-1688,TGTAGTCCCAGC seq_32,-1534,TGTAGTACCAGC seq_32,-1511,TGTAATCCCAGC seq_32,-789,GCTGGGATTACAG seq_32,-668,CTAGGATTACA seq_34,-1240,TGTAGTCCCAGC seq_34,-1062,TGTAATCCCAGC seq_34,-916,TGTAATCCCAGC seq_34,-785,TGTAATCCCAGC >data set hm21r >instances seq_0,-527,TCCCTTTTTGGCCC seq_1,-979,TCCCTATTTGGCC seq_1,-403,TCCATCTGGGGCAC seq_2,-225,TCCATATACGGCCC seq_2,-179,TCCTTCTTTGGTC seq_3,-315,TCCATATTAGGAC seq_4,-100,TCCTTTTATGGCCC >data set hm22r >instances seq_0,-421,CACCTCTGTCACCTTCC seq_1,-358,CACCTCTGTCACCTTCC seq_3,-291,CGCCTCTGTCACCTTCC >data set hm23r >instances seq_0,-414,TGGTCA seq_1,-489,TGGTCA seq_2,-59,TGGTCA seq_3,-458,TGGTCA >data set hm24r >instances seq_0,-13,GCCGCTATTAC seq_1,-385,GCCGCCCTTTC seq_2,-10,GCCGCCATT seq_3,-333,GCCGGCCTTCC seq_3,-35,GCCGGGCTT seq_4,-16,GCCGCAGTTTC seq_5,-99,GCCGCCGTTGTTCC seq_6,-358,GCCGTCCTT seq_7,-453,GCCGACTTTGC >data set hm25r >instances seq_0,-150,GATCAAATTGACGTCATGGTAAAAATTGACGTCATGGTAA >data set hm26r >instances seq_0,-622,CCCACCTCCCTCTATC seq_1,-72,CCCGCCTCCCGCTCCC seq_2,-593,CCCGCCTCAGGCTCCC seq_2,-180,CCCGCCTTCTTCTCC seq_3,-293,CGCGCCTCTGTCACC seq_3,-225,CCCGGCTAACCTTTCC seq_4,-906,CCCGCCTCGGCCTCCC seq_5,-995,CCTGCCTCAGCCTCCC seq_5,-860,CCCGCCTCAACCTCCC seq_7,-951,CCCGCTAGTTCCTCCC seq_7,-60,CCCGGCTCTTTCTAGC seq_8,-563,CCCTCCTCACACTTGC seq_8,-328,CCCGGCTCCCGCTCTC seq_8,-26,CACGCGTCCCTCTCTC >data set mus01r >instances seq_0,-402,ACAGCTATTCTTCCAT seq_0,-360,AGAGTTTCCGTTCCAT seq_2,-474,ACAGCTTGCCTTCCAT seq_2,-216,AGAGATGGCCTTGCAT >data set mus02r >instances seq_2,-896,CACATACATACACACATGCATA seq_3,-723,CACATAGATACACACATGCTCA seq_7,-740,ACATAAATAAATACATACATACATA >data set mus03r >instances seq_1,-14,TGGCTTCAG seq_2,-480,TGCCTTCAG seq_2,-72,TGGCTTCAG seq_3,-71,TGGCTTCAG seq_4,-293,TGCCTTCAG >data set mus04r >instances seq_0,-622,AACCAGATAT seq_1,-442,AACTGGATA seq_1,-37,AACAGGATAT seq_2,-916,AACCAGATAT seq_4,-778,AACAAGATAT seq_5,-844,AACTGGATAT seq_5,-430,ACTGGATAT >data set mus05r >instances seq_0,-251,ATGAATTAAAAC seq_1,-479,ATGAGGTAAGAC seq_2,-232,ATGACGTCAACC seq_3,-278,ATGAGATGAATC >data set mus06r >instances seq_2,-230,ATAAGAAAGTAGAG seq_2,-167,ATAAGAAAGTAGAG >data set mus07r >instances seq_0,-985,CACGGTGCCCAGGCACC seq_3,-127,CACGGTGCCCGGGCAAC >data set mus08r >instances seq_0,-1500,GTGTGTGTGTGTGTGTGTGTGT seq_0,-1468,TGTGTGCGTG seq_0,-49,GGGTGTGCGTG seq_1,-1349,GTGTGTGTGTGTGTGTGTGTGTTTGTGTGTGTGTGTGTGTGTGTGTGTGTGTGTGTGTGTGTGTGTGTGTGT seq_1,-693,CACCCACACA seq_1,-682,ACAAACACACACACACCACACACACACACACACACACACACACACACACA seq_2,-316,ACACACACACACACACACACACACACACACACACACACACACCCTC >data set mus09r >instances seq_1,-374,GAGAGGCAAGA seq_1,-325,GAGAGGCAAGA >data set mus10r >instances seq_0,-565,GGGTGGGG seq_0,-109,CCCGCCCC seq_0,-74,GCCCCGCCC seq_0,-57,CGCTCCGCCC seq_1,-193,GGGTGGGGGTGGGGGTGGGG seq_2,-678,CCCGCCCGCCC seq_2,-646,CCCCGCC seq_2,-593,CTCGGCCCCGCC seq_2,-543,TCCGCCCC seq_2,-73,CACTCCGCCCCGCAC seq_2,-53,CGCTCCGCCCC seq_3,-596,GCCCCGCCCC seq_3,-521,CCCGCCCC seq_3,-506,CCCCGCCCC seq_3,-483,CACCCCGCCCTC seq_3,-469,GCTCCGCCCCGTCC seq_3,-446,CCCGCCC seq_3,-97,GGGCGGGG seq_4,-129,GCCCCGCCCCC seq_4,-14,GGGGGGGGG seq_5,-667,CGCGCCGCCC seq_5,-523,CCCCGCC seq_5,-161,GGGTGGGG seq_6,-524,CTCAGCCC seq_6,-134,CACTCCGCCC seq_7,-217,CTCTGCCC seq_7,-171,GGGAGGGG seq_7,-125,GCTCCGCCC seq_7,-89,CCCCGCCCCC seq_8,-445,GGGGGGGG seq_8,-133,CTCCGCCCCCCGCCC seq_8,-25,CTCCGCTC seq_9,-175,GCTCCGCCCC seq_9,-154,CACCGCCCCC seq_9,-12,GCCCCGCGC seq_10,-669,GGGGGGGGGG seq_10,-340,CTCAGCCC seq_10,-223,CTCCGCAC seq_11,-836,CCCCGTCCCCCGCCCCCGCCCCC seq_11,-285,GGGCGGGGGGGAGGGG seq_11,-89,CTCTGCCC seq_12,-209,GGGAGGGG >data set mus11r >instances seq_0,-230,GGGCAAGGGCGGC seq_1,-256,GTCACAGGAG seq_1,-183,GACACCAGGG seq_1,-130,GGCCATTCGCGAC seq_1,-97,GCCAGTTGGGGC seq_1,-68,GACAGCGGCGCC seq_2,-242,GGCAGGTGAGGACATTGGAGTC seq_2,-180,GCCAGCAGGG seq_2,-147,GGAAATGCGCGCC seq_3,-287,GGCAGTAGAGCC seq_3,-242,GTGCAGAAGAGCC seq_4,-179,GGAGAAATGAGCCGGCACAAGGG seq_5,-496,GGCCAATGGCGGC seq_5,-403,GGCACGTGCG seq_5,-130,GACAGGGGTG seq_6,-90,GGTCAGCTGTGTC seq_7,-420,GACAGGGGAG seq_7,-176,GGCAACAGCGGC seq_7,-103,GCCAATGGCGAGCGGGGGC seq_7,-20,GGCATCGGAGCC seq_8,-104,GGCCACTGGAGCC seq_9,-214,GTCACATGGGTC seq_9,-191,GCCAGTCGTGCCAAAGGGG seq_10,-482,GGACACAGGAGAC seq_10,-391,GACAACGGGG seq_10,-273,GACAAAGGAGAC seq_11,-156,GGGCATTTGTGCC seq_11,-49,GGACAGCTGTGTC >data set mus12r >instances seq_0,-176,ATGGGGGTTTAA seq_0,-92,AAATATGTGTAA seq_1,-253,ATTATGGTGTAA seq_1,-95,AATCTGGTGTAA seq_2,-423,AATTGAGTTTAA seq_2,-260,AATGGAGTGTAA >data set yst01r >instances seq_0,-282,TTTTTTTTCGC seq_1,-293,TTCTTTTTCTC seq_2,-651,TTGTTTTTCAC seq_3,-287,TTTTTTTTCTC seq_5,-826,TTCTTTTTCCC seq_6,-944,TTATTTTTCCC seq_6,-347,TATTTTTTCTC seq_7,-521,TTTTTTTTCTC seq_8,-951,TCCTTTTTCTC >data set yst02r >instances seq_1,-418,ACCGGCGGTCTTTCGTCCG seq_1,-328,CGGATCACTCCGAACCGA seq_1,-210,GGAGAGCTATTGTTCAAA seq_2,-279,CGGAGCACTGTTGAGCGAA seq_2,-192,CGGACAACTGTTGACCG seq_3,-174,ACCGGCGCACTCTCGCCCGAA >data set yst03r >instances seq_0,-192,CAGATTCTTATTATTAAG seq_4,-427,CAGCTCCTCTATAATAAG seq_5,-110,CAGATACTTCATTATCAG seq_6,-120,CAGTTACTAGTTCATTTG seq_7,-65,CAGCTACTGACAACTAAG >data set yst04r >instances seq_1,-344,CTTTTCTGGCATCCA seq_2,-957,TTATCGCGCACCC seq_3,-678,CTTTTCTGGCAACCA seq_4,-181,CTTTTCTGGCACACA seq_6,-755,TTTTCCGGCAGAAA seq_6,-721,TTTTCCGGCAAGC >data set yst05r >instances seq_0,-217,CTAATTGGGTAAGT seq_1,-327,CTAATTAGGAAACT seq_2,-201,CTAATAGGGAAATT >data set yst06r >instances seq_5,-493,TAAGGCATCGCAC seq_6,-154,TAAGGCATCGCAC >data set yst08r >instances seq_0,-469,GCACCCAAACA seq_0,-20,CACACAAAC seq_2,-634,GCACCCATACCT seq_3,-653,CACCCAGACAT seq_4,-614,CACACAAAC seq_4,-453,CACCCACGC seq_4,-409,CACCCAGACCT seq_6,-446,CACCCAATCC seq_6,-424,CCCCCACAC seq_6,-333,CACCCAAGCA seq_7,-900,CACCCAAACAT seq_7,-437,GCACCCACACAT seq_7,-420,CACCCAGACC seq_8,-417,GCACCCAATCA seq_8,-72,CACGCATAC seq_9,-472,ACCCAGAC seq_9,-222,CACACACTC >data set yst09r >instances seq_2,-157,TAGCCGCCGA seq_3,-951,TAGCCTCC seq_4,-566,TAGCCG seq_4,-285,AGCCGC seq_4,-250,TAGCCGC seq_5,-184,TAGCCG seq_6,-732,TAGCCTC seq_6,-167,AACCGCC seq_7,-594,AACCGCC seq_7,-220,TAGCCACC seq_10,-611,AGCCGCCAA seq_11,-484,TAGCCGCCG seq_12,-671,TAGCCG seq_12,-245,TAGCCGCCGA seq_13,-857,TAGCCGCC seq_15,-826,TAGCCACC seq_15,-448,TAGCCGCCGA