Figure S5: Top motif from PosMotif1 on samples from the ABS database in Tompa's format >data set aml >instances M26179,-234,CCCCGTGACGTCACCCGGAGCCCGGGC X05831,-166,CCCCGTGACGTCACCCGGACTCCGGCC >data set ap1 >instances extracted50,-107,CCACGTAAGCATGTTTAC extracted51,-123,CCATGTAAGCATGTTTAC K00650,-300,CTGCGTCAGCAGGTTTCC M23768,-293,CTGCGTCAGCAGGTTTCC >data set ap2 >instances U32675,-77,GGGGGCGGGCGGGGGCG L06620,-59,GTGGGCGGGCGGGGGCG M26179,-202,GGGCGCGGTCGGCTGCG X05831,-134,GCGCGCGGTCGGCCGCG >data set ap2a >instances U34070,-373,CCCCCACCCCTACCCCGTGCA U36308,-437,CCCCAACCCTTACCCCTGGCA extracted15,-411,CCCCCACCCTTAACCCCAATA >data set caat >instances Y00474,-70,GAAAGTTGCCTTTTATGG V01217,-73,GAAAGTTGCCTTTTATGG X00182,-68,GAAAGTTTCCTTTTATGG M61126,-108,GGGCGTGGCCTTCTGGGG M29660,-128,GGGCGTGGCCTTTTGGGG L36125,-127,GGGCGTGGCCTTTTGGGG extracted56,-38,GGAGGTCACTTTATAAGG extracted57,-58,GAAGGTCACTTTATAAGG extracted58,-53,GAAGGTCACTTTATAAGG >data set cebp >instances M18472,-327,ACACACCCCATGGACTGG extracted46,-325,ACACACCCCATGGACTGG X76685,-420,ACTCACTCTATAGACTAG extracted48,-347,ACTCACTCTATAGACTAG >data set cets >instances AY008847,-38,AGGAGTAGAGTATATAAGTTCCAG D63333,-96,AGGAGTAGAGTATATAAGCACCAG >data set cjun >instances J04111,-45,TGACTGGTAGCAGATA X57155,-52,TGACTGGTAGCAGATA J02971,-68,TGATTGTTAGAAATTA D14461,-66,TGATTGTTAGCAATTA >data set cmyc >instances AF224272,-157,CAAGCGGTCACGTG AF224272,-137,CAACAGATCACGTG extracted29,-206,CAAGGGGTCACGTG extracted29,-186,CAACAGGTCACGTG >data set coup >instances U81851,-168,GCAGCTATGTACATGTTGGAGA M63800,-152,GCAGCTATGTACATGTTAGACA >data set creb >instances K03021,-129,ATTCCTGCGATTCAATGA M26065,-188,ATTCCTGTGATTCGATGA M31184,-200,ATTCCTGTGATTCGATGA X56849,-121,AATCCTGGGAGTTGGTGA X56850,-92,AATCCTGGGAGTTGGTGA >data set cutl >instances extracted54,-28,GCTGGGACTGTCACTCATTCTCCGATC extracted55,-44,GCTGGGACTGTCACTCATTCTCCGCTC >data set e2 >instances X00371,-376,CCAAGCTTAGAAACATGACAGGTCC extracted09,-396,CCAAGCTTAGAAACATGACAAGTCC >data set e2f >instances X57138,-89,AGAGGAAGCTGCAAGCT D43966,-319,AGAGGTAGCTCCAAGCT >data set e2f1 >instances extracted33,-63,GGCGGGCCGGGGCC extracted34,-208,GGCGGGACGGGGCC X00855,-123,GGGGGGGCGGGGCC extracted35,-439,GTGGGGGCGGGGCC extracted35,-343,GTGGGGGCGGGGCC extracted36,-300,GGCGGGGCGGGGCC extracted37,-278,GAAGGGGCGGGGCC >data set e47 >instances D88270,-236,TCCAGCAGGTGCTTCCTCCCTGAATGCTTCCAT extracted47,-98,TCCAGCAGGTGCTTCCTCCCAGAATGCTTCCCT >data set egr1 >instances U34070,-198,GCTGGAGGCGGTGGGCG M62362,-212,GCAGGAGTCAGTGGGCG U32675,-93,GGCGGAGACAGTGGGCG L06620,-69,GGCGGAGACAGTGGGCG >data set ets1 >instances S54531,-323,TGTAAGTAGGTAGGC extracted01,-326,TGAAAGTATGTAGGC extracted50,-374,TGGAAGTAAACATGC extracted51,-198,TGAAAGTAGAGATGC >data set fxr >instances AJ250902,-67,TGACTTAGGGGCTGAGCCT U00938,-64,TGACTTTGGGGCTGAGCCT AF044316,-101,TGACTTCTGGAGTCAAGGT AF044315,-102,TGACTTCTGGAGTCAAGGT >data set gata3 >instances AF377331,-111,TCAAGATGAGTAAAGATGTGGTTTCTAGATAGT L13028,-108,TCAAGATGAGTAAAGATGTGGTTTTCAGATAAT >data set gata6 >instances U72959,-197,CAGTTGTAATTAGCACCCCGGGTGTCAGCCAGAAAC S77762,-171,CAGTTGTAATTAGCACCCCAGGTGTCAGTCAGAAAC >data set gc >instances U68061,-184,GATAACCTGAATCAATATTTCC AF221746,-188,GATAACCTGAATCAATATTTCC >data set gr >instances extracted25,-59,AAGGTTACTAGTTAACAGGCATTGCCTGAAAAG extracted26,-65,AAGGTTACTAGTTAACAGGCATCCCTTAAACAG J02816,-64,AAGGTTACTAGTTAACAGACATCACTTAAAAAG >data set hif1 >instances X13323,-80,AGTGGGTGGGGCTGGAACATGAGTTC M33961,-78,AGTGGGTGGGGCTGGAACATGAGTTC >data set hltf >instances X13323,-80,AGTGGGTGGGGCTGGAACATGAGTTC M33961,-78,AGTGGGTGGGGCTGGAACATGAGTTC >data set hmgi >instances V00534,-319,AAATGACATAGGAAAACT V00534,-292,AAGTGAAAGTGGGAAATT M27481,-192,AAATGACAGAGGAAAACT M27481,-165,AACTGAAAGTGGGAAATT >data set hnf1 >instances AF051355,-224,GTTAATCAT U57552,-225,GTTAATAAT M17156,-209,GTTAATGAT M60197,-182,GTTAATGAT M11844,-101,GTCAATAAT M19524,-102,GTCAATAAT AF093878,-427,GTGAATGAT extracted19,-63,GTTAATAAT extracted18,-63,GTTAATGAT extracted25,-127,GTTAATTAT extracted26,-128,GTTAATTAT J02816,-127,GTTAATTAT U72959,-395,GTCAATGAT S77762,-372,GTCAATGAT >data set hnf3 >instances M11844,-139,TATTTGTATGGGTTAC M19524,-140,TATTTGTGTAGGTTAC X76685,-173,TGTTTGTTTTAGTTAC extracted48,-95,TGTTTGTTTTAGTTAC >data set hnf3b >instances AF051355,-123,ACTGGTGATGCACCTTTGAT U57552,-129,ACTGATGATGCACCTTTGAT >data set hnf4 >instances AF051355,-231,TGCCAAAGTTAATCATTGG U57552,-232,TGCCCAAGTTAATAATTTG M11844,-108,TGACTAAGTCAATAATCAG M19524,-109,TGACTAAGTCAATAATCAG >data set hnf6 >instances U72959,-167,AGAAACCAACAAACAGCCA S77762,-141,AGAAACCAACAAACAGCCA X76685,-124,AGTAACCTTGAAACACCGA extracted48,-46,AGTAACCTTGAAACACCGA >data set hox >instances extracted54,-28,GCTGGGACTGTCACTCATTCTCCGATC extracted55,-44,GCTGGGACTGTCACTCATTCTCCGCTC >data set hp1 >instances extracted25,-59,AAGGTTACTAGTTAACAGGCATTGCCTGAAAAG extracted26,-65,AAGGTTACTAGTTAACAGGCATCCCTTAAACAG J02816,-64,AAGGTTACTAGTTAACAGACATCACTTAAAAAG >data set hsf1 >instances extracted39,-216,GAAGACTCTGGAGAGTTC extracted39,-133,GAAAACCCTGGAATATTC extracted40,-227,GAAACCTCTGGAGAGTTC extracted40,-146,GAAACTGCTGGAAGATTC >data set ipf1 >instances S99616,-239,GTTAAGACTCTAATGACCC X04724,-217,GTTAAGACTCTAATTACCC >data set irf >instances X76685,-327,AACACCTAGAAGCTAAAGAGA X76685,-113,AACACCGAGGCCCTCATGCCA extracted48,-250,AACACCAAGAGACTAAAGAGA extracted48,-35,AACACCGAGGCCCTCATGTCA >data set m1 >instances extracted41,-183,CACAGCGGACCCGAAGA extracted41,-147,CCCAGCTGACCCAGGGA M24410,-127,CACAGCAGACCCAAAGA M24410,-91,CCCAGCTGACCCAGGGA >data set maz >instances extracted31,-415,GCGCGTAGTTAATTCATGCGGC extracted32,-223,GCGCGCAGTTAATTCATGCTGC >data set mef2 >instances extracted07,-31,GGGTTTAAATGGCACCCAGCAGTTGGCG X71910,-36,GGGTTTAAATGGCACCCAGCAGTTGGTG extracted08,-50,GGGTTTAAATGGCACCCAGCAGTTGGCG X85744,-33,GGGTTTAAATGGCACCGAGCAGTTGGCG >data set mef3 >instances X12447,-37,AGGAGCTGCCTTATAACC X04260,-40,AGGAGCTGCCTTATAACC >data set mitf >instances X16073,-309,ACTACCTCTCATTTGCAAGGTC D00439,-222,ACTACTTCTCATTTGCAAATTC >data set mtf1 >instances X15128,-39,CGTCCAACGACTATAAAGAGGGCAGGCTGTCC extracted10,-43,CGTCCAACGACTATAAAGAGAGCAGACTGTCC >data set myb >instances X75755,-193,GGGCGGGGCGCGCGGC X75755,-126,GGGTGGCGCGGGCGCC extracted17,-139,GGGCGGGGCGCGCGGC extracted17,-73,GGGTGGCGCGGGCGCC >data set myf >instances U18131,-182,GCTGTAATCACTTTGGGAGACTGATGCTCCATGACAGCTAGAAGTTGGATTGAGTTTCAGTAGCTACTATATATAAAGCTGGGTCGACTTAT M84685,-92,GCTGTAATCACTTTGGGAGACTGATGCTCCATGACAGCTAGAAGTTGGATTGAGTTTCAGTAGCTACTATATATAAAGCTGGGTCGACTTAT >data set myod >instances extracted07,-31,GGGTTTAAATGGCACCCAGCAGTTGGCG X71910,-36,GGGTTTAAATGGCACCCAGCAGTTGGTG extracted08,-50,GGGTTTAAATGGCACCCAGCAGTTGGCG X85744,-33,GGGTTTAAATGGCACCGAGCAGTTGGCG >data set mzf1 >instances S66422,-191,TTTCCTCCTCCTCC S66422,-176,TCTCCTCCTCCTCC extracted30,-201,TTTCCTCCTCCTCC extracted30,-177,TCTCCTCCTCCTCC >data set nf1 >instances M26179,-234,CCCCGTGACGTCACCCGGAGCCCGGGC X05831,-166,CCCCGTGACGTCACCCGGACTCCGGCC >data set nfat >instances extracted21,-50,TTAATCATTTC X03020,-53,TTAATCATTTC X00695,-402,TTATTCTTTTC X52618,-405,TTATTCTTTTC J02971,-55,TTATTCATTTC D14461,-53,TTATTCATTTC >data set nfkb >instances extracted21,-48,AATCATTTCCTCT X03020,-51,AATCATTTCCTCT AY008847,-216,AGTCATTTCCTCT D63333,-281,AGTCATTTCCTCT X00695,-400,ATTCTTTTCATCT X52618,-403,ATTCTTTTCATCT >data set nfy >instances M29549,-62,ATAGGTGATGAGGTTTATTTGCATATTTC M63335,-61,ATAGGTGATGAGTCTTATTTGCATATTTC >data set nkx2 >instances extracted25,-57,GGTTACTAGTTAACA extracted26,-63,GGTTACTAGTTAACA J02816,-62,GGTTACTAGTTAACA AF023131,-46,GGATACCGGTTAAAA AF025766,-38,GGATACCGGTTAAAA >data set nrl >instances extracted56,-155,TGTCACCTTGGCCCCTCT extracted57,-164,TGTCACCTTGGCCCCTCT extracted58,-159,TGTCACCTTGGCCCCTCT >data set oct >instances L10616,-176,ATCTTGAGTACTAGAAAGTCATGGATGA extracted12,-161,ATCTTGAGTACTAGAAAGTGATGAATAA >data set olf1 >instances extracted11,-299,TTGCCACAGCAATTG extracted11,-19,TGGCAGCAGCACTTG extracted22,-267,TTGCCACAGCAGTTG extracted22,-19,TCGCTGTAGCACTTG >data set p53 >instances M21487,-183,CAGCCCATACAAGGCCATGGGGCTGGGC M21390,-182,CAGCCCATACAAGGCCATGGGGCTGGGC >data set pou1f1 >instances extracted13,-299,AGTATCCTACCCTTGGAT X12967,-328,AGTATCCTACCCCTGGAT X00368,-144,AATAAAATACCATTTGAT V01244,-146,AATAAAATACCATTTGAT >data set pou2f1 >instances X00695,-274,GAAAAACTGTTTCATACAGAA X00695,-86,GAAAATATGTGTAATATGTAA X52618,-284,GAAAATTTGTTTCATACAGAA X52618,-94,GAAAATATGTGTAATATGTAA >data set rar >instances X56849,-121,AATCCTGGGAGTTGGTGAT X56850,-92,AATCCTGGGAGTTGGTGAT X74153,-297,AATACTGAGTGTTTGTTTT M16400,-295,AATACTGAGTGTTTGTTTT >data set rfx1 >instances J04718,-337,ACTTTCACTTTCGTGGC extracted42,-269,ACTTCCACTTCCGTGGC >data set rxr >instances extracted49,-352,TTCTGTATGATCTCTGT extracted49,-199,TACAGAATGTTATTTGT M29301,-315,TTCTGTATGATCTCTGT M29301,-162,TGCAGAATGTTCTTTGT >data set smad >instances AJ404961,-227,CGGCGAGCCCTGGGCAC AJ404961,-71,CGCCGAGCGCTCGGCCC AF156727,-175,CGGCGAGCCCTGGGCAC AF156727,-26,CGCCGAGCGCTCGGCCC >data set sp1 >instances extracted04,-152,GGGCGGGG X67686,-151,GGGCGGGG extracted05,-155,GGGCGGGG U43589,-102,GGGCGGGG L11910,-155,GGGCGGGG AF004877,-305,GGGCGGGG S54531,-49,GGGCGGGG U32675,-100,GGGCGGGG U32675,-81,GGGCGGGG U32675,-71,GGGCGGGG L06620,-76,GGGCGGGG L06620,-53,GGGCGGGG extracted14,-17,GGGCGGGG M13792,-199,GGGCGGGG M13792,-194,GGGCGGGG M13792,-151,GGGCGGGG extracted16,-106,GGGCGGGG extracted16,-57,GGGCGGGG X69723,-109,GGGCGGGG X00855,-127,GGGCGGGG X00855,-119,GGGCGGGG X00855,-84,GGGCGGGG extracted35,-435,GGGCGGGG extracted35,-339,GGGCGGGG extracted40,-81,GGGCGGGG AB029557,-241,GGGCGGGG M26179,-158,GGGCGGGG M26179,-153,GGGCGGGG X05831,-105,GGGCGGGG >data set srf >instances extracted04,-101,ACACCCAAATATG X67686,-100,ACACCCAAATATG extracted05,-108,ACACCCAAATATG M13631,-95,ACACCCAAATATG extracted06,-121,ACAACCTTATATG M86232,-121,ACAGCCTTATATG M86233,-121,ACAGCCTTATATG >data set stat3 >instances L05078,-231,CTCGGGGCGGGCCCGC L05078,-210,CCCGGGGCGGTGGCGC X72020,-230,CACGGGGCGGGCCCGC X72020,-208,CCCGGGGCGGTGGCGC >data set tbp >instances extracted04,-30,TATAAA X67686,-31,TATAAA extracted05,-39,TATAAA U34070,-30,TATAAA M62362,-40,TATAAA AF004877,-33,TATAAA extracted24,-92,TATAAA S99616,-45,TATAAA X04724,-24,TATAAA AF188709,-465,TATAAA AF188709,-457,TATAAA AF188709,-444,TATAAA AF188709,-27,TATAAA AF249274,-27,TATAAA S54531,-165,TATAAA S54531,-15,TATAAA extracted01,-64,TATAAA AF221746,-204,TATAAA M13483,-31,TATAAA M26773,-31,TATAAA extracted50,-31,TATAAA extracted51,-47,TATAAA Y00474,-29,TATAAA V01217,-32,TATAAA X00182,-27,TATAAA U18131,-111,TATAAA M84685,-21,TATAAA X00371,-33,TATAAA extracted09,-87,TATAAA X15128,-442,TATAAA X15128,-28,TATAAA extracted10,-465,TATAAA extracted10,-32,TATAAA extracted13,-30,TATAAA X12967,-56,TATAAA U36308,-31,TATAAA extracted15,-31,TATAAA X75755,-94,TATAAA extracted17,-41,TATAAA extracted25,-24,TATAAA extracted26,-30,TATAAA J02816,-29,TATAAA X00695,-24,TATAAA X52618,-32,TATAAA X13323,-31,TATAAA M33961,-29,TATAAA AF044316,-47,TATAAA AF044315,-50,TATAAA AB004306,-8,TATAAA J04500,-28,TATAAA X57138,-32,TATAAA X73536,-55,TATAAA M84340,-32,TATAAA AF377331,-32,TATAAA L13028,-30,TATAAA X74153,-34,TATAAA M16400,-30,TATAAA extracted49,-65,TATAAA M29301,-452,TATAAA M29301,-27,TATAAA U81851,-28,TATAAA M63800,-365,TATAAA M63800,-28,TATAAA X00368,-28,TATAAA V01244,-30,TATAAA >data set tef1 >instances extracted04,-117,GGGGCTCTAGTGCCCAAC X67686,-116,GGGACTCTAGTGCCCGAC extracted05,-124,GGGACTCTAGTGCCCAAC Z20656,-159,GGGGCCCTGCTGTCCTCC M62404,-159,GGGGCCCTGCTGTCCTCC extracted13,-352,GAGGCTCTGTTGCCCCTC X12967,-378,GAGGCTCTGTTGCCCCTC >data set usf >instances extracted56,-36,AGGTCACTTTATAAGGGTCTGGGGGGG extracted57,-56,AGGTCACTTTATAAGGGTCTGGGGGGG extracted58,-51,AGGTCACTTTATAAGGGTCTGGGGGGG >data set vdr >instances U60669,-161,CTCACCTCGCTGACTCCATCCTCCTTCCAC L04608,-143,CTCACCTCGCTGACTCCATCCTCTTCCCAC