def test_submittal_4(self): genome = "CTTGTAATCGTTCCGCAAAATGAGCATTAATTGGGTCTTGCCTTGCAACGGTGCAGCGTAGTGCCATCCTAAGCCTCGGTAATAGTCAAGGATTCTCTCGCGGTTAAGTTTAGCAATACTTGCAACGGTGAACGGTGTATGATTTCCTTCTTTACGGTTGAGTATTCTACTTGCAACGGTGAACTTGCAACGGTGTCTATTCACTAATGACTGAAGTACTTGCAACTTGCAACCTTGCAACGGTGATACGTGCGTGCGGGTGAGTGATCTCCTTGCAACGCTTGCAACGGTGAATTCGACACGATACTCTTGCAACGGTGGTGCAAGGGGTCGGGGGAGACAGCACCTAGCTACACAGAACGCTAAACGTTATTGCGTATCTGACCATAAGCCATGGGATAGCCGCACCTCGGGCCTTGCAACGCTTGCAACGGTGTAGACCAAACTTGCAACGCTTGCAACGGTGATATGACTTGCAACGGTGTGAGATTGCTTCACCGCTTGCAACCTTGCAACGGTGAACGGTGTTTGTAATCGCTTGCAACGGTGGTGTAATCTGGAGTTCCTTGCAACGGTGCAACGGTGTGAATGCGCCGATTGGGGTGCCTTCCGACCCCTCTTGCAACGGTGTGTGGAGCTCTATACGGGGGTCCAACGCCTATGAAGAACGCTTTGTAGATGAGCCTCTAACGGAAGTTAGTCCAATGGAAAATCGTAGGTGGGGATATATTGTCGTGTATATTGGTGCGTCGGGTCGTTTTTCACTAGCCATACGGATTAACCCCTCGCTGGCCCGAGATGGCGTTGGGGTTTCGGCCCCTCGTGCTGTCGAACTGGAACGGTAACTATGCCGGCCGATCAAGAATATAACTCAGAGCGAATCCAGACGCGCGAGTGGTTTACCATGGAGCTCAAAGAATCCCAGGTTCGTCCTCGGCATCCCCGATGATCAGGTGGGGGCCAATCACGTACTGGTTCTGGACGCACGCTCCTACTTATGTTCACAAGCCCAACCATTCCGTAAGGGGAGCTGAAGACGACCTAATGTGTTAGCTGTCTCATAGACGCATTCAAGCCGTATCTGGTCTGTTTCTTGTCCCTCGTGCCTGGAAGAGTCAATAGAGAGAAAAGAAAAATGCTCGAGGATCCATTCACCCTCATGCTGGGCGCGTTACCCCGGAGACGCTTCGAGGCCTTTAGTACCTTGCGTAAATCCGCCTGAAAAGCACCTGTGTTTAGTGATGTGATATGACCACCCCCGCACCTACCGTACGTCGCATCAAACTGTCCGTTTAGTGATGTTTAGTGATGTTTAGTGATCCGTTTGTTTAGTGATTACATTCCAGCTACCACGGTTTAGTGATTGTGATAAGTTTAGTGATGTCGCGCTACGTTTAGTGATTGGGTCAGTGGTTTAGTGATCGCTACCGCTGTTTAGGTTTAGTGATGTGATCATATTAGTCGTTAATCAGGGCCAACGTGGGGTTTAGTGATTTTAGTGATGAAGGTGTTTAGTGATGAAATTCCGACTTCGTTTAGTGATCAGGCCCCAGTTTAGTGTGTTTAGTGATTTAGTGATACCAAAATGCGTTTATTAACATAAACATGTGAGGTTTAGTGATTAGTGATTGATTTTCTGATAACCCTTTTCCCCAGATGGCTGAATGGCTCTCAGAGGTGGAATTCGGTTTAGTGATCTTGCAATCTCGCGAGTGTATTAAGGACCAGCTGTTTAGTGATCGGGTTTAGTGATCCTTGATAAAGAGACGCGTTTAGTGATCGGACCTTCCATCCATTCAGGCGCTGTCGAGATTGACTGACTTGGGATAAGCGCAGGACAGTTTTACCAGTTCAAGGGCATAACGTTCGAAGAATAAGGCAGACTTGGACAATACTCCTGCACGTATGCCAGGAAACGAGTGCGCTCCTTTGGGACGATCCCCACCAAGACGCACATCGGTC
ACCCTGGTGTCTCCAGGCTGTACTCGTGGGTTGAGTGCACTGCTATTTAGACCATGATGTGTTGTTGTAAGGTGCATGAATGAAGCGTTGTTCCTCTTACTCAGCTGTCAACCTCCTTAACCCGTAGTCACGAACTAAATCCTTTCCTGATAGGAAGTAGAATGTGTTTCAGTGTACGTGATAATAAGGCGGAGGGAGGACCTCTCAGAAAACTGTCCAGATACTTCCTTCAGTCCCCGTAATATGCCGAAAGTCGTAACCGGCCAGGCCAGCACGGTTGATATTATTAACTTTGTGAAGCATTGTGTCTAGATGCGTTGTAGAATGTCACGAGGATATTCACTTAACTCGGGCGCAGCAACGTAAGGCGACATAAAACACCTCACCAGCCGTGCAAGAGTACAAACTCCGCTCGTAGGTACCGTAATGGATAGACGTAGTTTCCCAGACATCGAGGCTGTCATGCTTTACTTCCAGATAAAGGAGACTGTGTTACACTAAATGCTTGACAGATATTATCACAGACTAGCTCCTTTGGGCGTTGCTATGCCCACCCACCCAGTTGACCACCCCCTAATTCAGAGCACTCTATGCCAGATAAGTTAGGAATTAAGCGTACGCAGAGTTGCAACCTACTCATCGCTAAGTACTCTCGACCGGGTCCCCGCAGTTGCTGCCGGGCTGCCGGTCTGCCGGTGTCATTCCTACATGCCTACTAGCTGCCGGTGTTCTCCCTCCGCGCTGCCGGTTCTAGCCGACAGCTGCCGGTGGTAGCTGCCGGTTCACGGACCTGCTGCTGCCGGTCTGTGGACGTATAGCGCTGCCGGTGGTTTATAAGCTTTATCTCGAGACCGCTGCCGGTGGAACAGTGGAGCTGCCGGTATTGGAACAGTGGAACAGTGGACGATGTCCGTTGCCCGAACAGCTGCCGGTTATTGCTGCCGGTGGAGCGCTGCCGGTGAGGAGCTGCCGGTGCCGGTCTGGGGATTAGGTGCTGCCGGTACAGTGGGGCTGCCGGTCAGTGGTACCATACCACCTGCTGCCGGTGCTGCCGGTTTAGCTTGGCTGCCGGTGATGCTGCCGGTAGTGGGCTGCCGGTGGATTGGATAGGATCGCTGCCGGTGAACTTGGATATTGGAGCTGCCGGTCGGCTGCCGGTACGAAGCTGCCGGTATAGGATCGGGCCGGCGTCCTAGCGCTGCCGGTAGGATCGGATAGGATCTCTTGGATAGGATCCAGTGAATTGTCGTGCCCAGCTTGGATAGGATCCTCAGGAGTGAACATTGGATAGGATCTTGGATAGGATCAGGATCGTGCAAGACGACAATGTGGGGTTTTGTTGGATATTGGATAGGATCGATCTTACAACCAGTGCACTGGGTTATTTGGATAGGATCGGATAGGATCTCGAGCAATCTGGAGGATCGTGTAGCTGAGGATCCGGTTGTTGGATAGGATCGGATCCGTTGGATAGGATCTTGGATAGTTGGATAGGATCATAGGATCTTGGATAGGATCGATAGGATCTACGAGAAGAGCACTTTGAACTGTGACTCCACACGAGTCAGAACGCGCGGCAAAATGTCTGTATAGTCCAGATTAGGGAAGCGCGGGATTGGAACGGACAAGAGTCATGCAGACTGCGCCCTTTAACTAGTGAGCAAAAAAGGGACCTCTATTACTGCACTAGCGGTGCCACATACTGTGTCGCCTTGCCGGGAAGGCGTCGCACGGACCGCCGTTTATGGATCCAGCCTTTTGTGGAGTACCGGCTGCGTCTCGTCTCCTTGTATCAAACCCCTAAACTGCACTTCGCTCAGACCCTTGTAATGTCGAATCCGTACACGGTCCCCAGGAGGTGCCCCCATAAGAAGTGAGCCCCATTGCGTAGCCCAAGTAGCTTCTTATATGGAAGATACGCTCGGGCAGGATATTACGCGCGGCCAGAGGCTGTCGCTCGGGCAGGCCTCTGCTTGCTAACGTACCGCTCGCTCGGGCAG
GGTCGCTCGGGCAGGGCAGGTGACGCTCGGGCAGGTCGGGCAGGGCTCCGCTCGGGCAGGAGGCTCGCGCGCTCGGGCAGGCGCTCGCTCGGGCAGGGTTGCAGACGCCGCTCGGGCAGGCCTTCACGCTCGGGCAGGAGACTGCGCTCGGGCAGGTGCCGAAAATTGATCGTACCTTTGGGGGAAGACTCCTAAAATTTTGATCTTCTCCGCTCGGGCAGGGTGACCGCTCGGGCAGGAAGCTGGCCGAGTTCCTGGTCGAGGTGGGTTCGCTCGGGCAGGGACCACGCTCGGGCAGGCGGGCAGGCCGTGTCTTCGAAACTTCCACGACTACTAACGCTCGGGCAGGGACTGGGAGCGCTCGGGCCGCTCGGGCAGGCCACGCTCGGGCAGGGTATTGGGCGACTGCGCTCGGGCAGGGCCGCTCGGGCAGGCGCTCGGGCAGGCATCGCATATGGCCGCGCCCAACACCCCTATATTATTTTGCTCGAGGATGCCAATGACCATGTCCGAGCGTTAGTGCAAGCCAGTAGCATTTGCCATCCGCTGGACACAGGCATCGAATTAATGGTGCGCAAATTGAGGTTAGTTCTTCACTGCTGCGAGGAGGGTGAACACATATAGACGGTGACGGTAGGGGTTATGCCAGACGGTAGGGGACGACGGTAGGGCGACGGTAGGGGGGGCTAATTTCATAGACGGTAGGGGGTGACGGTAGGGGCCAGGTTGACGGTAGGGACGGTAGGGCAGTGTCTTGACGGTAGGGAAACGACGGTAGGGAATCACTTGCTGCCGCCAACTAGCAACGGAGACGGTAGGGACCGATAAGGGTCGCATTGTAGGCTAAATATCCTTAGAAACAATGACGGGACGGTAGGGGGTAGGGCACACACTAGACGGTAGGGGAGGTTGACGAGGTGGGACGGTAGGGACGGTAGGGGCGTCGAGTGACGAGACGGTGACGGTAGGGGCAATGCATAACCTACACACTTGACGAGTGACGAGGTGGCGACGGTAGACGGTAGGGGGTAGGGGGTGGCCGAGGTGGCTGACGGACGGTAGGGGCCATGGGCACTAGAGTGTTCGCGGACGGTAGGGTCGGACGGTAGGGTGTTTGTGACGAGGTGGGACGGTAGGGTAGGGGGTGGTGACGAGGTGGCGACGAGGTGGCACGGACATCACCGGAAGGAATCCCCCGAGGTTCCCATTAGCGGGACTGTATGGTTATGTGCCCCCAATGGAGGATGACGAGGTGTGACTGACGAGGTGGCGGCAGCGGCATATCTCACTTCAGATTCTATGGCATTGACGAGGTGGCAGGTGGCGTGACGAGGTGGCGGTGGCACCTGACGAGGTTGACGAGTGACGAGGTGGCCGAGGTGGCGATGACGAGGTGGCGGTTGACGAGGTGGCTTAGGATCCGCTCTCCTGCGTCCCGAAGACGACTTCAATTGCTACAGTCCATTAGATTTGGTAGTTATCCAAGCGCGAATGCTAACGGTCATGTACTACCATGAAATATGGTGCTTTAGGGAGCACGGCTTCCGTCTTCGGTGGAGGGAAATAGAATTCCACTAGCAGGGAGCTGGCGACTGAGTGGATACAGTTAGTACGGTCCGGGCCGTGCTTTGAAGATGGCCGCCTATCCCCTACTACGGTTAGGAAGCCCGATCGCTGAGTCATCGTCGTGAACGTGGCATACTCTGCACCGCTCAGCCGAGTTATCGTCAAGTTCAGATCTATGGACGAACGGGTTCCCTTTCTACACTACGATTCTGTCCGCCAGTCGTTCATGTACTATCAAATCACACAAAAAGGTAGAACGCCTGAATCAAGAGCGCTTCTGGCAAGATATCTTAAGTGCTTTGAACTACTTGTACAGCCCCCCACTCAATAGGGGTTTATTCGTGGCACTTGGAGCCGCCGGTATATAGCGATACACTCGTATAAACCGGTAATGAAACCCGCCTTGGGGCATTAGGCCATCATTATATGGGAAC
TGTCATGGGCCTTGCAACCCGACGGTTAAATACTACGTCACAGTTCAAAACGGATTTTAGCGGTATAGTGCGCTTTACCCCTACTTACAGCACCCCGCGCGGGTCGAGCGGCAGCTTGTAGCGCGGAAGATGCTCGATTCGCGACGACAGCTGCTATGGACTCCGCCCGCCTGAATTCGAACAGGAAACGCTAGTTTGGAGCTAGGGAGTCCCTGAGTCGAACGTAAGCATTGTGCGCACCACTTAGTTGCACTGGTGACCAGCCCGACATTATGTTAGAGGATCCGCATACACTAGTTGAGAAATTCTGCTGCTGCTTGTTTTATGGATGAAGGAGTAAGGGGGAAGCGAGAAGCACGATAGCAGAGATGCCGAGTTATTGTCAACAGTGAATGTGTTAGTCCGCATCTCAACACTATACTACTGGGTGCTGCCGGAAAAGCTTGTACTTACAGTAGAATATTATTGAGGCGCGTTTGATTGTCGGTAGAGGCATAAGCGATTGCATGTCGTAGTGTCCGGCTGTCCGCCGATAGTCCACCACTGCTAAACAAGGCAAGTATTGATGTCGAAACGGGCTATATAACATGACTTAGTGCCTTCAAGTTTGGTCGATATCCCACCTGCCGACGACAATTGGCCAAAGGGACCGCGCCTCGCATAGGTTGTCACCCGCGTTCTCAAAAGAAAGGTGAAAACCTCAGATACCCCACAGCGTCATGCTCTCTCTGCGTACTGTGAGGCTAATACAGCCCTTAGAGCGTTCCTCCTCCTCTACCGCGCGTCGCGCTAACCCCGAACTTCAGTAGACAAACCGACGACGACTTGTCCGGCCGTAGAAACGTGAAATGCAGAAGTCGATCTATGTAGCAGCGGCCTCAGATATACGTTCCGCTAATAGGCAGCCCTACAGTCGTGGGAGATGAAGGGTTGGCCGGGCATTCGGATATATATCCATCTCTGGTCGTGTTGTCAAAACTAGGTGTTACCGGTTAATCGCATTGTTGTATCCGCCTTAATGACGCGCGGAAACTTGCCCTTGCCAGAACACTGTTGGCTATTACTACACGAACTACGAAGTGGGTCACATGCGGGAGGCTTAGACTGTTTTGTTGGTGAGGGCGGACCTGGTTGGAGACGATGAGTAGCCACGGGAGACGAGGAGACGATGCACGAATCTGTCGAGTAATCGAGTAACAATGAGGATCGAGTAACAATAGTAACAATAGTAACAATATAGTCCCTCGAGTAACAATAGACGATGGACGATGGACGATGGCGAGTTAAACACAGGGGTCCTTGGATAATAGGAGACGATGTGAGCCCTCGGAGCAGGAGACGATTCGAGTAACAATATCGTCGAGTAACAATCGGACACGGAGACGGTCGAGTAACAATGGAGATCGAGTAACAATGTAACAATGGGAGACGATGTTCTTCGAGTAACATCGAGTAACAATGTTCGAGTAACAATTTTCGTCGAGTAACAATAATCGATGTCGAGTAACAATCGAGTAACAATAGAGGCCTGAGTCGAGTAACAATTACCGCGGCCTGACCTCAGCGGGTGACGGAGACGATGGGGAGACGATGTCGCCTCGAGTAACAATCGAGTAACAATGACGATGGGAGACGATTCGAGTAACAATGAGACGATGTCGAGTAACAATTCGAGTAACAATTCGAGTAACAATTCGAGTAACAATAAGAAATGGAAAGAAATGGAAAGAAATGGAAAGAAATGGAAAGAAATGGAAAGAAATGGAAAGAAATGGAAAGAAATGGAAAGAAATGGAAAGAAATGGAAAGAAATGGAAAGAAATGGAAAGAAATGGAAAGAAATGGAAAGAAATGGAAAGAAATGGAAAGAAATGGAAAGAAATGGAAAGAAATGGAAAGAAATGGAAAGAAATGGAAAGAAATGGAAAGAAATGGAAAGAAATGGAAAGAAATGGAAAGAAATGGAAAGAAATGGAAAGAAATGGAAAGAAATGGAAAGA
AATGGAAAGAAATGGAAAGAAATGGAAAGAAATGGAAAGAAATGGAAAGAAATGGAAAGAAATGGA" clumps = find_clumps(genome, 12, 542, 18) self.assertEqual( "AAAGAAATGGAA AAATGGAAAGAA AAGAAATGGAAA AATGGAAAGAAA AGAAATGGAAAG ATGGAAAGAAAT CGCTCGGGCAGG GAAAGAAATGGA GAAATGGAAAGA GGAAAGAAATGG TCGAGTAACAAT TGGAAAGAAATG", " ".join(clumps))
def test_find_clumps_with_sample1(self):
    """Check find_clumps on the first sample genome with arguments (5, 50, 4).

    The result must equal the list ['CGACA', 'GAAGA'] exactly, order included.
    """
    sample = "CGGACTCGACAGATGTGAAGAACGACAATGTGAAGACTCGACACGACAGAGTGAAGAGAAGAGGAAACATTGTAA"
    expected = ['CGACA', 'GAAGA']
    self.assertEqual(expected, find_clumps(sample, 5, 50, 4))
def test_submittal_2(self):
    """Check find_clumps on submitted genome #2 with arguments (11, 520, 19).

    The arguments are presumably k-mer length, window length and minimum
    occurrence count -- confirm against find_clumps. The result is compared
    as a single space-separated string, so the order returned matters.
    """
    # One contiguous sequence; adjacent literals are concatenated by Python.
    genome = (
        "TGGACACACACCCACTAAGATAACGCTGTGCGAACGCTGGCTAGTGACAGAACACATGTACACACATCTGAATGATAGCCATATAGCGTTAGGAGGCTGCTGCCCCGTGGTCATGATGTACACTCCCCCAATAATGCGAAAATCGAGGCCGGCTCCCCCTCAATATTGTCTCTCTAATCGCGGAGCAGAAGATCCCGGCTCACCTACCGAATACGTACAAATCTGGCGAGGACATGTGCGATGAGTGACCATAATTCAGGGGATCTTTGGGAGTCCGATGACATTCCAGTGGGCCTTATGCCACACGGTATGGGCCCAGGTGATCATCACCCAGATTGAAAGTCGATAACTTATCTCCAGAACAGCGCCTCTCAACAGCCCGTTGGTCAGCCGTCTATTAGCCCGTCCGTCCGCTTTATTGTTACGGGTGCGACTCCGGGCAAGGCCGCGCGTCCAGAGCAGTCTGGCTGGCGGCAATACTTAATAAACCAGAGTCCATTTCGAGCGTACTTCTAGACTTTTCGGCCGCTTAGTGTCTCCGCTGTGCTTAGTGCAAGCATCGTCCCAGTTTCTCATGTAGCGACAGGATGAGAGTACATCCTAACAAATTATCTAAGATGCTCCACTACCCACGCAGTCACTTGTTACGATTGTGCGTTATAGGCTCTATTATCGAAAGGCCAGCCGCGTGGCAAAGTGTACCGGCAAGGACAACTCTCTGCTCTTCAGGCTAAGTGTGCCTTCTGGTTGTGGACGTCTAATTATCAATGATTGAACGAATGCGACTTGCGCGGATTATCGACGACCGGAGGGATGTACGGAGTCCATCAGCGGATAGCGCCGCCTCCGATGAGCGACTACCAAGACGCCTGACCATTCATTGTAACGCCCGGCCAATAGCATTCGACACGACCTGGTGTAGGACATTAGCTCCGTTTGTAGCCGTCCCAGGTTCGATAAGCTGCTCTAGGCTGCGATCTGAGGTGGAGCAGATACTCGGACATCGAATTCATGGAGCCCGAAGCTCCCGGACGGGTTATATACAGGAAAGCGTGCACCATCTAGGAGTTCTTCTACTCAATTAGTTCCACGTGATCAGTCGAATAGAGCCAGATTGTCGAATTCCGGTTTGTATTCATCCTTGCGTAATAAGTGTTTAATCGATACCCCATGCAAGTGGTATACGGGGAATCAGACCCGACCCATACGCGGTGTGGACAAGCTATCTTTGACCTAGAGTGCCATTGTAATGCCGAAAGCGAAGAAAACATTTATTATACAAGTTAACCGGCACATGGTACCTCGCGAGAGGAATAAGCCGGTTCCATAGTACGCAAGGATTTAACCCAATCCGGCCGTTGACCTGAGGTAGGGTGGCACTTGTCCGGTGGCCCAACCTGAGCGCTACTCGAAGTTGCCAACTCCACAACGAATACTATCCCCGGGTTGCGCGACATTTTCTGACAGCATGTCTTTTACGCACCACATCCCTCTCACACACACATCCCTCCACATCCCTTCGGACGGCACATCCCCACATCCCCACATCCCTGGGATAACTCCCGCACATCCCTCTGAAAACGAGAGGGTGAGCACATCCCTCATCCCTTTCCCTTTCACATCCCTGAGTCGCCGGCCACATCCCTACCACATCCCTTGAGTCGCCAGTGAGTCGCCTCTCAACGATGTCACATCCCTGTCGCCTGCACACACACATCCCACATCCCTAGGACAAACACTTGCCAAACAGTGCCACACATCCCTCCCTGGATGTGGTGAGTCGCCTAGTTGTGGTGCGCTGCGGCGGTGAGTCGCACATCCCTTCATGTCACATCCCTCATCCCTCGCCTGAGTCACACACATCCCTAGCCCAGGTGAGTCGCCCTCACCACTGCCCCTCGTGAGTCGCCTGGAATGCACATCCCACATCCCTGAGTCGCCGTCGCACATCCCTCACATCCC"
        "TCCGCCGGAGTGAGTCCACATCCCTTGTGACCACATCCCTCTAGTCGCCTACGGGTTTGTACGCGGGTGAGTCACATCCCTACTCTAGTCCGGGTGAGTCGCCCTCATAGTGAGTCGCCCCCACAATACTAACGTGAGTCGCCGCTTAGACCCTAATGTGTGCGGCATTTACTAAGGCCTCCTACTTGCGTTATGGTCTTTTACCCTCCTCAGTTAATCACAGACAGTTCCGGGGCCGAAACTCATCAGGTGACCAGAGGCAAATCACAAGTAAACCCCTGATCTAACAAGTGCGGAGTCTGCTCACGTAGAATGCTTAAGTTCCCTTCAATGCTCAAGTTCGGATCTCGGTTCTTGGGGCTTATTGATGTAGAATTCGATCGAAAGAACTCACCAAGGCCTGCCACAGTCGCGTCATCATGGACAAGCCACGTAGGGTTTGTAAGGGTACGGTTAGCCCATTAAGTTTTGTTGCATTATAATGCATTATAACCTGATAAATACAAGAACTGCATTATAATCCACGGATCATAGGTGTACGGTCCCGCTCGATATAGTAACCGCGGGCTGGGCTTCATGCATTATAACTGCATTATAAGGGTCAACAGTTCTCCGCCGCGGGCTGAGTGTGCATTATCCGCGGGCTCCGCGGGCTTTATAAATACCGCGGGCTAAGTGGAGCCGTTACCGCGGGCTGCGGGCTCCGCGGGCTATCCCGCGGGCTCATCCGCGGGCTCCGCGGGCTGCTCCGCGGGCTCGTGCATTATAAGCATTCCGCGGCCGCGGGCTAATCATTGCATTATAAGTGCCGCGGGCTCCCCTGGCCTCCGCGGGCTTAAAGTGCCGCCCGCGGGCTATGCATTATAAAATGCACCGCGGGCTGCTTTATAACATTATAATCGCCCGCGGGCTACACTTTCCTACATACACTTTCTTTCTATAAGCTACACTTTCAGGGGCCCGCGGGCTTACACTTTCCACACTTTCCTACACTTTCTTATTACACTTTCTCGGGTAGAGCCGCGGGCTATTACACTTTCGAAATACACTTTCTCTCTACACTTACACTTTCACTTCACGCTACTACACTTTCATTACACTTTCTCCACGAATCCTCTATGAGTTACGCGGCAAGTACACTTTCTAAGGCAAGAGCAAGATAATAAGTCGCTTAGCAAGATAATGCGATGCAAACAAAAATTAAGGAGTACACTTTCGGCAAGATAATACACTTTCAATATCAAAACTAAAGCTGCAAGATAATGAGGACGGTACACTTTCTAATGTATGCTACGCAAGATAATACACTTTCCCTCGCAAGATAAGCAAGATAATAGGCAAGATAATAGCTTTCCGCTTCATCTTTTACACTTTCCATACACTTTCTACACTTTCTTCACTTTCGCAAGATACACTTTCCACTTTCGTGTTCTACACTTTCTGCTCGCACTGCGCAGGCTGTACTGGTTGCACAGAATAAATGAGCGAGACCCACGGTACTTGTAGAAGTTGCATATGCGTCTGGACGTCGCTTTTCAGATGAGCCAATATTGGAGGTAGAGCAGTTTTTCAGCTAGCCTGTAGCGAAAGGTCCCCGCGTCAGGGGCTATGCGCTAGGCTGGACAGTAGTGGTGACGATCCGCGCTTTGTCATACCTTCGCGTGGAGAGCAGGGGACTCTGTTGGGCAATCCTGGATAACGTTCCCTGGGAACATCTTAATTACGCATGGAAGTCCGGTATACGCGCTGGCAATGTACAATTAGGCAGACCAGCTCAGAGGCCACATCCGGAAACATCTGATAGGTTTCCGATCAGACGAAACACCACCGGTCGTGCTGGGAGATAGGACACCGGAGCAACTGCCTAATCCCTCGAAGGGTTTTGCCCACGCCACTATTATTACCCTATCTGTTCCCTCTGGATACTGTACTATGGTATCTTCGCTCATTTTCCGTGGGAGGCTTCGACTATAGGTCGGAGTGTAGCTAGCATTACTTTA"
        "AATACACGTTTGAGGGTTTAGGTCGTGCTCCGCGCGTTTTTTTCGCAGTCTGCCATGTTTTGGCTTCCACAGTACATTCCCTGGTCTACCGATGCGCTAAGTTATTACGATCAATGCGAACGTGTGCGTGCGGTTTTAGCCCGCAATACTCTGTCTAGAGTCGGCCGTTTCTCTAAACACTCCGTCGCGCTACCTGAATCTAGACAGTCCGTCGCGCTATGCGCCGTCGCGCTAAAACCGCCCCGTCGCGCTACTAACCTACAAGACCGTCCGTCGCGCTACGTCTGCGCCCGCCGTCGCGCTACTACTCCGTCGCGCTATTGCTACGTGCTGACGTGAGCCTCCGTCGCGCTATCACAGCCCGTCGCGCTATCGCGCTAAGGCACCCGTCGCGCTACCCTGGTCGGAAGGGGCCCGATGCCGTCGCGCTACACATACCGTCGCGCTATAACTCTATAGGAGGCATCGACCGTGCACAATACCCGTCGCGCTAGTAAGACCTCCACAGTAGACCGAGGCCGTCGCGCTAAGACTACAGTGGTGATGCATCGATTCGCAACTCGCCGTCGCGCCGTCGCCCGTCGCGCTATTACAACGCGGACCCGTCGCGCTACTAAACCGTCGCGCTACCCGTCGCGCTATTGTGAACCGCCGTCGCGCTACGGCCGTCGCGCTACTAGTCTTACCGTTTACATCCGTCGCGCTAACTCTGCCTTAGTTTGACATGAGTCTACCGTCGCCGTCGCGCTATCCTCAAGAGAATTACAAACCTAGTCTGGTGGAGATTTGATTCTAACCTACCTACGGGAGTACTGGACTCAGTGTATCCTAGCCTCCATGTGACCAAGTAAACGAAGGTGTGGAACCTTCACGCTACCCACTGTACACGTTGAGCATCAGCCGACTTAGACTATTCTCTTAGAAGACATCAGTTATGTAGATTAGTAGTTTACGGTGACTGCACCCATTAGCATCTGGAGGGCAGTTATATCACAAAACGCTTTAACAAAGCTTCGGGCGTGCGATACGTCTCCCTACGTACGTGGAGAATCAGTACCTTCGCATGTTAAAGGCAACTCTCCGACCTTAAACCTACGTCGCGTCGTCTAGCGATCTGGGTATACGTAATGCGGCAATACTCAGCTAGAGCTGCACAGGTACATGCAGTTGACGCGAGCGTTTATTTACATTTTTAGGTTGAGCATCCTACACTATTCGGGATGCTAGAAACGGGCGTCTGCTAACTCAAGCCATACACAGTATATTTAATAGTTTGGCATACCTACAGGACCCAGTAATGCAATAATGGAGAGGCTGGTGGGCCCTGAGTTTTACTGCCTCACTGTCTGCACGTACCAGATTGAGCCTCTATACTCTCCATCATCTCGTCAGAGGTTGTCGTTTCTTACTCTCAACAATATGATTACAACTGCATGCACATTCCATCATCGTATGGGAGACATACGGAGCAGGGCTGTGTTGTCTCCTTTCCATCATCGGTCCATCATCTCCATCATCCTAAATCCGCTGTCCATCATCTCTGATCCATCATCGTGCCAAACGTCCTGGTACCGCATGGTTAATGAGGCTTATTTGTGTAGATCCATCATCTCCATCATCGAAGCTACTTAAGACCGGATTCCATCATCTTTAGCGAGTGGCTTCCATCATCTTATTCCATCATCTGTTCCTCCATCATCTTCCATCATCAGGGGCCATGTATGCTCCATCATCGGCTTTCAATCTCGAGGGCCAAGAAGTCCATCATCTAAACCGTCCATCTCCTCCATCATCCGGTAGGAAGTGTTCCATCATCCATCATCTCCATCCATCATCAAGCGTCCATCATCACGTCTCGTCCATCATCATCCTATCCATCATCCATCCATCATCCATCACTGTTCCATCATCCCTTCTCCATCATCCGTTTCGAAAGCCTCTTTTACAGCGACTTTACCAGGCGCTGACTCGCGCGGATTAATATCCCCCAGCTAGTTGAC"
        "GGGTACGGGGAAGAGCTACCCTGTATCATCCTGCCCCCAACAATCAAACAGCGTACGACTCGCGCACAACATAGCGTTAAGAATATGGCGATCCGAAGCGCTTTTGGTGTCGCCGCATTGTTCGTGAGCCTCGAGTGTCGCCGCAGCGTGTCGCCGCAGTCGCCGCAAGTGTGTCGCCGCATGTCGCCGCACAGTGGTATGGGATTGTGTCGCCGCAGGTGTCGCCGCAATAGCGAATTAGGTGTCGCCGCACTCGTGTCGGTGTCGGTGTCGCCGCAGCCTGGTGTCGCCGCAGTGGTGTCGCCGCACGCAACCGACGCTGGTGTGTCGCCGCAACGTCATACTGCACATGTAGAAAGGAGGTGTCGCCGCACCAATATAACTACTTCCGACTCAGTGTCGCCGCACAGTGTCGCCGCATGGTAAAGAAAGTGCTCGGTGTCGCCGCATCGCCGCAAACAATTAAGTGAGAACGAGTGTCGCCGCACGCCGCATCAGTGTCGCCGGTGTCGCCGCAGTGTCGCCGCACGCCGCAGCGACCTCAACTCGGTGTGTCGCCGCACTTCCCTGTCTTGTGCTGCCAGGTGTCGCCGCACTGTCGCTTCTGTAAGACGCGGGCAGCAACCAATTCGATATTCAATGTGTCGCCGCAACGTAATGGAAACGGACTTAGGGATCCCTGCAGAGAGCACTTTCAACGAAACTTGAGCTTACAACGAGTCTGTATAGCTGTGCCGGTAGCTACAGGTCGACAGCCACAGTGGATTACATTGCTCCGGTACATTCGCAGTACAGGACATGGCAACGGGGGATATTTTACAATTATAGCACGTTCGTGGCGATGCAGGGGTTGCACGTATAGAAATGGCAGATCAGGACCGAGTAAGCAAAGTTCAGCGAGACGTAGAAATGATCAGTTGCTGAACATCGAGCAGCTGAAACCCACGCCCACAGTCAGGGCGGGACGCGACGCGAAAAGCTTACAGGTTGAGTTCCAATGGGCTACTAAACGGAAATTACCAGAGGCTCTAATCAAAGCGTTGTCCCTACATTAAGTCCTTCGCCGAGGTTCAAATGACGGATGAGCACCTATGGGTACAGTCGAAGGAGGTTTGACGCGGCTTCACGGGCGAAGGCGAGCGCCACCTCCCAGTAGTTACAAGGAAGGAACCTGCCCAGTGTTCTATGCTAAGCGAAAAAAAAGCCGAACCAAACCTGCCGGAGCCGCGGTCCAAGCTGATAGGGCCTGCGATCTATACACATAGCTCACTAACCTCTATACGCTGCCGACGCTCTCGCCACGCAATTTGTGCTATGTTTGGTAGAGGTAGCACATGGTGGCATCAAGCACCTGCGTTCATCGGTGGCATCAAGTGTGGCATCAAGCTCATTATATATGACGTGCGATGAAATGATCGGCTTGCGTGGCATCAGTGGCATCAGGCATCACACTATACTGCCAACCGCAGCTGTGGCATCATTAGGTGGGCCGTGTGGCATCAACAGTGGCATCATCAGCTCAATTAACGCGTGTGGCATCACATGTGGCATCATGTATTTTTAGTTCCAATAATTAGTTTAAAAGGTACGGAGGTTGGGCTGGGTGGCATCAGAAGTGGCATCATGTGCCCAGCAAAATTCCAGGCATCACGTGGCATCACAGCAAAATTCAAATTCGGCTCTCTCAAACCGAGTACGTGGGAGCAAAATTCTCAATTCGTTGTTGAGCAAAATTCAAGTAGAAAGCGGCTCAAGCAAAATTCAGGTGGCGCACGAGCAAAATTCGGCATCACATCAATGTGGCATCAGTGGCAAGCAAAATTCAGAGCAAAATTCAAAATTCAGCAAAAGCAAAATTCAAATTCAAATTCAGAGCAAAATTCAAAAGCAAAGCAAAATTCTTCTTCAGCAAGCAAAATTCAATTCAGCAAAATTCAGCAAAATTCAGCAAAATTCGCAAAATTCAGCAAAATTCAGCAAAATTCAGCAAAATTCAGCAA"
        "AATTCTACCATCGATTACCATCGATTACCATCGATTACCATCGATTACCATCGATTACCATCGATTACCATCGATTACCATCGATTACCATTACCATCGATATTTACCATCGATCCATCGATTACCATCGATTACCATCGATTACCATTACCATCGATGATTACCATACCATCGATCGATTACCATCGATTACCATCGATTACCATCGATTACCATCGATTACCATCGATTACCATCCATTACTCTTAATTCATTACTCTTACCACACATTACTCTTAATTACCATCGATTACCATCCATTACTCTTAATTACCATCGATTACCATCCATTACTCTTATTACATTACTCTTACATTACTCTCATTACTCTTATACATTACTCTTACATTACTCTTACATTACTCTTACATTACTCTTACATTACATTACTCTTACTCTTACATTACTCTTACATTACTCTTACATTACTCTTACATTACTCTTACATTACTCTTACATTACTCTTACATCATTACTCTTATACTCATTACTCTTACCATTACTCTTACATTACTCTTACATTACTCTTACATTACTCTTACATTACTCTTACATTACATTACTCTTACATTACTCTTA"
    )
    expected_kmers = (
        "ACATTACTCTT",
        "ATCGATTACCA",
        "ATTACTCTTAC",
        "CATTACTCTTA",
        "CCGTCGCGCTA",
        "GTGTCGCCGCA",
        "TACATTACTCT",
        "TCGATTACCAT",
        "TTACCATCGAT",
    )
    found = find_clumps(genome, 11, 520, 19)
    self.assertEqual(" ".join(expected_kmers), " ".join(found))
def test_submittal_1(self):
    """Check find_clumps on submitted genome #1 with arguments (10, 499, 16).

    The arguments are presumably k-mer length, window length and minimum
    occurrence count -- confirm against find_clumps. The result is compared
    as a single space-separated string, so the order returned matters.
    """
    # One contiguous sequence; adjacent literals are concatenated by Python.
    genome = (
        "GGTGCGTAAATCCTGGGTGTACCCAGAGCCGGCTATAAGGGAGTATCAACTCACCCGCGCAGCCGGAGACGTATATTCCACTTGAGTACAACAACCCGTCGTCAGGGAGGAGACTAGCCTCCAGCATCTTCAGGTTTCGGAACACCTTCCGTCGTAAGCCAAGTAAGATGGTTAGGGACCGGCTATCAGACGCCCGTCGGGGAAACGTTATTATCTACAGTGTTTACCTAAAACGCGTGACGCGGTATACGTCCGATATAGAGTTGAACCGATCTAAGATTAGGGGGTATTAATACGATGAGCTTCTGAGCGTTTCGCCATCGAATGTGAGTAGTTAGCTCTATAAAATCTAACTTCGGGCTCCATGATGAGTTTCCATCGTCTGCAGGAGCTATGGGGCTAGAGTTAAGAACTTATTCGGGAGACAAGTAATTTAACATCAAGGGGCATACGAGTAACTGTAAATTCGCGATTTCGCGATGCGATTCGCGATCGCGATCGAGTAATTCGCGATATTTCGCGATAATAAGTTCGCGATCGCGATGATCGATTAAGGGATCCGTAAGACGAGTAAAGGCCACCCGACCCTCCCGCTTCGCGATTCGCGATGCAAACGAGTAAAGGACTAGGCGTACGAGTACGAGTAAATCCTGTGACACGAGTAACGAAAGAGCCACCCTGGACAAGGACGAGTAAACGAGTAAATCCTTCGCGATGCGATTTTCGCGATAACCATCATCCATCATCCGTAAGGTTTCGCTTCTTCGCGATGAGTAATCCGTAAGGTAACGAGTTTCGCGATGGTAAGGTAAGACGAGTAACGAGTAACCGTAAGGTTCGCGATCATTCGCGATGGTTTCGCGATGTAAATTGTCGAACTTCGCGATGATCTTCGCGATTTAGGAGTTTCGCGATGCTGTGACGAATCGAGTTCGCGATTCCGCGACGGTCCCTAATTCTTCGCGATGTCTCGCGGGGTTCGCGATCTCGGGGTAATATACTGCTCACGCGGACGCCGATGTTACCTCGGACACCCTCCGATAGGATTTACCGTCCTGGACAGACCGGAGTTACTACATCGACTCCCCGCGGTCACACCACAAGATAAATGCGACCCTACTAGCGGGCATTGTCCGTTTCACGCCCTACCGTTCGTAACGACGGAGATCTTCCACGAGCACCTGCTGTGTCGCTAGCAGGCCTCAAAAAGATCCCCGCTCTCCGCAGACGTAGGACCGTACAATGGCTCCAGTGACAAATTTGGTCAAATCGGAAGTTTTCTCCCGATCAGGTGGAAAGTACTGTCAAGCACGTAGCTTTCAGTAGTGACACATTATATCTAAAGTAATGCAGTTAACCCTACCAGGGTATACGGCGAGCTGAAGCGTTCAGACACATTTTCAAGTCAACAGGAGCTGGCAAGATGTTTTAGCAGTTTTATGTACTAGCTTGAACGAATATCATGACGGGTATGAGACTACACGCGACATAAAGTCGCCGCGTTATAGGCTGGCGTTTAAAAATTTCGAAGGGTTTGGCCTTCATTGTGGTTCATTTAGAGACAGAGAGACTTCTGAGACCGGTACTCAAGCAGTTTAGTTTCTGAATCAGAAGTACGCCCTCGAGATGACGTCGCTGGGTCGTCACCAATCGCCCTGAGACCGCGCTGGACCGACGGTCTCGAGGAAACATCACCAGAATAAATTTAACGCGTGAGATGCGCATACCTTTCGCTAAGAAAATCGCAGAGTGACCGACACTACACTATTCTACAGAACCGCGACACTAGCGATACAATTAAGAATTAACCATGTGTCTCAAACCATGATGCTGATTCGACACTACCTCCCAGCCGACACTACTCCGACACTAGCACCCAGTTGGTTTTAAAAATTCGGACGACACTACTACTTGCAAGTATCATTTCGACACTAACTTGTTCTAAGGACTCGTATATTACAC"
        "CAGGGAGGGACTTGATCGACACTAGGGGATTGCCTGCTCGACACTACTACGACACTAGACACTATATCGGCTACGACACTAACGGTGTATATTTTCCCCGACACTACGCTCTTACACCGATCCTAGGGTTACGGCCTATCGACACTATAACTCGATTTATCTGCCGTGTCGACACTACGCGACGACACTACCCAAAGGGGCGACACTACCGTCGTTCGGCGACGACCGACACTATCCGTATGTCAGATGTACCCCGACGACACTATTTGCGACACTACCCGTCCGACACTATGGTGGTCGAGCGACACTAGAGTTAGACGGGTGGATCCCCAGTAACGCGCAATCTCTATAAGCCGGCGGTTCAAGGTGCATGATAAAAGACTAGGCTCGGGGCTCTAAGCCATGATCGTCGCTTGCATACTGAAGCCGTAAACACAGGTATACGTTCCACATGGTTTCCCACACATTGCAAGTTCTGAGGAGCAATATGTCGCCTCCGTTAGGCCCATCAGAACGATGTTTTATACTACTTAACATGTGTAGAGAGCGCTCGCCGGAGGGAGGGACCTATGATCTTGAGGGAGGGACCTAATTAGGCTGGTTCCTGTTTCCCAACTCGCGGCGAGGGACCTACGCATTACGTGCAGACTGCTGTACGGGGAGGGACCTAACAGGGCGAAGGGAGGAGGGACCTACTTGCGTTTAACTGTTCCAAACGCCGTCTAGGATAAGGAGGGACCTAGGGACCTACGAATTCCTTCCGAGGGACCTATGCTTCTAGAGGGACCTAGACCTAACCTACCGCGGAGGGACGAGGGAGAGGGACCTAACAATGAGGGGTACACATAATCCGAGGGAGGGACCTAGGTCGCGGATGAGGGACCTATAGTTGCAGTACTATCCGGCATGAGGGACCTATCAAGAGGGACCTATATGTGTGTAAAGAGGGACCTAATATGTCCCGGGCAGAAGGTCTGGTGCTCCTAGCCGTGATTTAAAGAGGGACCTAGAAGAGGGACCTACCTAAAGAACCGTTTTGAGTTTGGAGGGACCTAAGCTGAGGGAGGGACCTAGGAGGGACCTAACTGTACAGGACTCGAAATCCAAGGGACCTCAGTACCCCGTGCATGCTAGGTCGTATACGTCCACCTGTCCCGGCTTACGACACAGTTAAAGAGAAGATTACGTAACAGCGTAATTGCCTTCGCACAGAAGTTGTAAGGGGTAACGACCATGAGCTACGGTCGAGCTGCATATCATACCTTAACGTTTCTGATGCCTATCCTCAGGTACGTGCCGGCTGCAACAAAATTTCGGTAACACCTGGCAATGCTAGTGATCAAGTCTAAGCTATCACACAGGCACGGCCGCCGTCCACGTTGTGTGGAAGCGGGATAGGGCGGGGGGTGGCTTGGCCGGACCTTTAGGAGGGTAGAGATTCTCATTAGGCCCCCGCCATTTAGAACAGCGTTATCTGTTCTCAAGTCCAACTTTAACCCCTGCATCAAGCCTCCCGTTATTATGACTCATCTATCAGCCTGCGGGCGCGGACGGATTTCGCACCCCGAACTCTAACTTACACAAACGATTACGCACGAACTTCGCGAGCGTTTTCCGCAGGCTAACGTGAGAAACTGGGCAAGCATACAAATCGGGCCGACGGGGCAGGTTGACCGTTCTCCACTCCATGGACTAGGAGCCGAGTCACCGATAGGACTGATCTAATCCCGCCTTGCTAAACACAGTGTTACCTGAATCGGACGTAATTCTGGAGCGTGACCTGCTCACTGACACTAGTAATGGAATCAACTGGCGTAGACGTCAGTTATTTTACCTTTCCGTGCGTGCGTGTTCATCACACCCACCGTGTTCATACCATATCGCGTGTTCACCAGTAGGATCAGCCGGAAGCACCACGGCAGTCTCGCGACCTTCTAGTCAGCTCGTGTTCATTCAGATAGCGACGAGAGAGGGTATAGGCGGTGTCTATAACGCCACCG"
        "TGTTCACTCCGTTAGAAGACAGCAGCCGATCTGTATTTATTCACGGCCAATCGTGTTCCGTGTTCATGCAGATTACCTCCCCGATCCACTAGGCCGGTCCACTAACTCGAGTGTAGTCCTCTAAACGTGATGATCATCTAAAGCCCTCTCTATGGGATTAGTTGTGCGTCCGGCTGCCCCCGTGTTCACTATACATCGGTAACGGACAAGGCGCCCGTGTTCACCGTGTTCAGCGCGTGTTCATGATCATGCGTGTTCGTGTTCACATCTACGAGTGGGTGAACCCGACGTGTTCAGAGCCCGATGTCCCGGAAACGTGTTCAAGCCTTACATTAACTAAAAGAGTTCACGTGTTCAGTTGATGAACTGGACGTGTTCACGTCCGCGAATCCGAGTGATTCTCACCTCACGGCTAGCCTTTTGGCATGCCATGTTATCCCATCCACGCATGGCAGCTTCACCGTTGCACGAATTGCAGTAGATTTGTGTACTACTCCCAACACGGCCGGGGCCGTCGTCGATTTCTCGTCGACCGGGCAAACCCCTAGAGAAGAGTGGCTAATTGGACTTACCTGCCACTTCGCGGACCTAGATTCACAAACCGATTTCGAACTAGTCGTTGACTTCCTGCGTCGAACCGCACCCCACAAATAACTAAGAACAAATACTAAGGAGACGTTCTGCCATAAACGACGCATGGATTATTATGCTTGCGCGTGGCTAGTACTTTTTCAATTACAGAATGGTATCCCAGGGATAAATGTGCCCGTCATTTTGCGTTCTGATTCATTTTCTTGGACACGTGTCTAGGAAAACTTGCGCGCGGCCACTCTGGTAGAGGCTCTAATCCAAATGCGGGCCCAGTTACACGCGCAATGACGGACACAAGCAAACTACGCCATGTCAAACTACGTTGTCAAACTACGCCAGAAATTACGGAACCTCAAACTACGAAAACAAACTACGCCAAACTACGGGAACCGATCCTCTATAAGCCATCTTAAGGTTCCCCGGACAGTGGTAAACCAAACTACGCTCAACAAACTACGACGGTGAATATCATCCAAACTACGCTCTCAAACTACGCAAGAAACCTACACTGGTTTGCAACGGCTTGATCCGGAAGCAAACTACGAAACTACGCAAACTACGCGACAACTTTGCAATTATCCATAAGCCATATCCATAATCCATAGAGATACCTGAGGGAGGCTTCGTATAACCGACGCAGGACGCGTATCCATACCTATCCATAATACACAGCGAAACACTAAGTACAAACTACGTCGTATCCATACTTTTATCCATAGCTACAAACCGTCTGATAGGAATATTTATCCATATTCAAATATCCATAATATCCACCTTCCGCCTATCTATCCATACATATTATCCATACCGTACACAAACCAAACTACGCTACGGCGCTAGGCCTTGTATCCATAGAATAATTGCGGAATTTGGTTCCTCTCATATCCATATCCATACGGGTCTGCGGAGAGACATGTGCCTTTATCCATAGACCCACGACTGGATCGAGACCGCTTGAATCGGGTATCCATACAGGCGGTTCTTATCCATATAGCATGCCGCTCCTATCCATAAGGACACGATGAGAGCGGCCATAGTATACGGAATTTAGCGTATGGTCAGACCGAAAACCAGAGAGTATCCATAAACCATCTTTATCCATACAAAGCATATTATCCATACGTACTATCCATAGTATCCATACCATTATCCATAAAGGTGCAGCCCATATTCTCTCACAGGCAGAGTCCTAGATTGAGCCGTGTCTTGCCCGCATCATATACCTCCTTGGGCAAGCCCTTGACAGCCATTACCGTCAAGAGCTACGGAGGATTGCGCATGAGTCGTCAAACATTCTTTAACACTGTGCGCCCAGTCAAAAATGCAAAGTGATCGGTCTGTCCAAATATCCTGCAACTCGTAATTCAAAGAATCATGGCACCGGTACAAAATGAAAAGATCAGCTTTCG"
        "AATCTCTCTAGAGGTTTTGCCATTTGTCGCATAATCTGGAACGTTATGGCCCCCCGTTCTTTACATGGTGACCCCTTTCCAGTGGCCGTGGCCTATTGTTTAAACTGGGGTTTGTCCCTCGGGGTCTACACGACCGTCCATTCCCCCCCCACGACGAGGACGGAGACGCCTGGTGGTAGACAGTTACCACCGTTCAAATCTAGGGGCGTAATAGGAAAGAAGGACCTTTGGTATTATGAAGAAAGATTCTATAGTATGGTGTGTTTAGTATGGTGGACCTCGGTGGTGTAGTATGGTGCCTCTTTAGTATGGTGGTATGGTGTTCGACAAACCACCTAAAACTAACCTCTTAGTATGGTGCGCTAAGGTAAGGAGTATAACTAGGAGTGGTAGTATGTAGTATGGTGGGGTGAGCGATCAAGACTCATAGTTAGTATGGTGGTATGGTGTACACGGCCGGTCATCCAAACGCATGGATTTTAGGCATCTCATATATAGTATGGTGGAAGTGGATGGGTATAGTATGGTTAGTATGGTGATTTTACTGCTAGTATGGTGGATTTTAACGGGAACCAGAGCGGACGGGTAGTATGGTGCAGGTCTCGCCTAGTATGGTGTGTTTACGGGATTTTACCGGATTTTAGCGTGCGAGGGACGATAGTATGTAGTATGGTGATGGTGGATTTTATAGTATGGTGCGCGACGGCGACGGAAGGATTTTAGGATTTTATAGTATGGTGATTTTAGGATTTTAGGATTCGACGGAAAGGATTTTAGTATGGTGGTATGGTGACAATGCGACGTAGTATGGTGCGACGGAAATGGCCGACCGACGGCGACGGAAAATGGCGTCCAATG" "GCGTCCACGACGGAAGGCGTCCAATGGCGTCCAATGGCCGACGGAAGTCCAATCGACGGAACGTCCAATGGCGTCCAATGGCGTCCAATGGCGTCCAATGGCGTCCAATGGCCGACGGAAGTCCAATGGCGCGACGGAATCCAATGGCGTCCAATGGCGTCCAATGGCGTCCAATGGCCGACGGAAAAAATGGCGTCCAATCGACGGAAGGCTAGATCGGGGTAGATCGGGGTCGACGGAAAGATCGGGGTAGATCGGGGTAGATCGGGGTAGATCGGGGCGACGGAATCGGGGTAGATCGGGGTACGACGGAAGATCGGGGTAGATCGGGGTAGATCGGGGTAGATCGGGGTAGATCGGGGTAGATCGGGGTAGATCGGGGTAGATCGGGGTAGATCGGGGTAGATCGGGGTAGATCGGGGTAGATCGGGGTAGATCGGGGTAGATCGGGGTAGATCGGGGTAGATCGGGGTAGATCGGGGTAGATCGGGGTAGATCGGGGTAGATCGGGGGGAGGCACGGGAGGCACGGGAGGCACGGGAGGCACGGGAGGCACGGGAGGCACGGGAGGCACGGGAGGCACGGGAGGCACGGGAGGCACGGGAGGCACGGGAGGCACGGGAGGCACGGGAGGCACGGGAGGCACGGGAGGCACGGGAGGCACGGGAGGCACGGGAGGCACGGGAGGCACGGGAGGCACGGGAGGCACGGGAGGCACGGGAGGCACGGGAGGCACGGGAGGCACGGGAGGCACGGGAGGCACGGGAGGCACGGCCTAGGCAAGAGGCACGGGAGGCCTAGGCAAGCAAGCCTAGCCTAGGCAAGGCCTAGGCAAGAAGGCCTAGGCAAGCCTAGGCAAGCCTAGGCAAGCCTAGGCAACCTAGGCAAGGCCTAGGCAAGCCTAGGCAAGCCTAGGCAAGCCTAGCCTAGGCAAGGCAAGCCTAGGCAAGCCTAGGCAAGCCTAGGCAAGCCTAGGCAAGCCTAGGCAAGCCTAGGCAAGCCTAGGCAAGCCTAGGCAAGCCTAGGCAAGCCTAGGCAAGTGGCCTGGTGGCCTGGTGGCCTGGTGGCCTGGTGGCCTGGTGGCCTGGTGGCCTGGTGGCCTGGTGGCCTGGTGGCCTGGTGGCCTGGTGGC"
        "CTGGTGGCCTGGTGGCCTGGTGGCCTGGTGGCCTGGTGGCCTGGTGGCCTGGTGGCCTGGTGGCCTGGTGGCCTGGTGGCCTGGTGGCCTGGTGGCCTGGTGGCCTGGTGGCCTGGTGGCCTGGTGGCCTGGTGGCCTGGTGGCCTGGTGGCCTGGTGGCCTGG"
    )
    expected_kmers = (
        "ACGGGAGGCA",
        "AGATCGGGGT",
        "AGCCTAGGCA",
        "AGGCAAGCCT",
        "AGGCACGGGA",
        "ATCGGGGTAG",
        "CACGGGAGGC",
        "CCTAGGCAAG",
        "CCTGGTGGCC",
        "CGGGAGGCAC",
        "CGGGGTAGAT",
        "CTAGGCAAGC",
        "CTGGTGGCCT",
        "GAGGCACGGG",
        "GAGGGACCTA",
        "GATCGGGGTA",
        "GCAAGCCTAG",
        "GCACGGGAGG",
        "GCCTAGGCAA",
        "GCCTGGTGGC",
        "GGAGGCACGG",
        "GGCAAGCCTA",
        "GGCACGGGAG",
        "GGCCTGGTGG",
        "GGGAGGCACG",
        "GGGGTAGATC",
        "GGGTAGATCG",
        "GGTAGATCGG",
        "GGTGGCCTGG",
        "GTAGATCGGG",
        "GTGGCCTGGT",
        "TAGATCGGGG",
        "TCGGGGTAGA",
        "TGGCCTGGTG",
        "TGGTGGCCTG",
    )
    found = find_clumps(genome, 10, 499, 16)
    self.assertEqual(" ".join(expected_kmers), " ".join(found))
def test_find_clumps_with_play_3(self):
    """Check that find_clumps("1111222111", 3, 6, 2) returns an empty list."""
    expected = []
    found = find_clumps("1111222111", 3, 6, 2)
    self.assertEqual(expected, found)
def test_find_clumps_with_play_1(self):
    """Check that find_clumps on a digit string with arguments (2, 7, 3) returns ['67']."""
    digits = "123122123456789676767"
    expected = ['67']
    self.assertEqual(expected, find_clumps(digits, 2, 7, 3))
def test_find_clumps_with_sample2(self):
    """Check find_clumps on the second sample genome with arguments (11, 566, 18).

    The arguments are presumably k-mer length, window length and minimum
    occurrence count -- confirm against find_clumps. The result must equal
    the single-element list ['AAACCAGGTGG'].
    """
    # One contiguous sequence; adjacent literals are concatenated by Python.
    genome = (
        "GCGGTTATGCACCGTTCAAATTAGCAAACCACTAAGCGACGTAGTCTGGATTGATTTCTCCCTACCAGTGACCCAAGACGCGTTAGTGAGTTAAGTTCATATCCAGTACCTGCCGCCCTCTGTACTTGGGCGTCCGATTCGCATGCTTACTCAGGTGGAGGACACGATAATCTGATTAAACTGAGCTAAACCAGGTGGAACCAGAAACCAGGTGGGGAGTCTCGCTTCAAGCCGTTCTTGCGATCAAACCAGGTGGTCCATTATGAAACCAGGTGGCTAAACCAGGTGGTCCAGATCCTCGAATGATGTCGGTGCACATCAAAACCAGGTGGGGTGGTGGAACGTAAAACCAGGTGGCATAAACCAGGTGGGCCGGTTCGTAAACCAGGTGAAACCAGGTGGGGTGGAAACCAGGTGGGTTACAAATTACGTTGAGATGGCCCAAACCAGGTGGTGGGCTTCACCCATGTCAACAAACCACCCTATGGAACTAAACCAGGTGGAACCAGGTGGTGAAGGCTTATCCTCAGGAAAAACCAGGTGGAGGTGGTGAAATAAAACCAGGTGGACCAGGTGGATAACCCTCGCCTCGCTTCTCAACCGAGACCTGGATAAACCAGGTGGGGTGGTCCACCGATTTTTGAGACACTAGAAACCAGGTGGGCGGGGAAACCAGGTGGCAAACCAGGTGGGGTGGACGGAAACCAGGTGGATATGTCATAAAACCAAACCAGGTGGTGCACCCCCATGGTGTGTCTTATCCGTGCGTATAAACCAGGTGGTCGCACGGCTTCCACTTGCTGAGAATAGGCCCGCAGGGTCAGTGCCATGCCCTCCGTCACTCGATATGTGTTGTAAGAGTGGTTACCCCTTCATTGAAGTCGCCCACAGCCCCACCTGCATTGCTAGACTATCACCCTACAGTAGGCCTTTTCGCCTTCTTCAAGCAGCAATCTCTTATCCGCGGATGGGCGCGGCGAGCGTGGCGTCCCCGAACATTTTTACCTAACGTGTTTTGTTGGCCGCAAGCCTTCCCTCTAGTCCACCTCAGCCATTCAGCCTAGTAGCTTTCAAGCCGAGCCTTCCATATCTAATGGACCGTCCAGAATTTCACACGTTTCACAGGGCTGTGTTCGACCGCCCGTAATGCTGTTTCACAGGCGATCGCCTTGCGGTTTTTTCACAGATCGCAGCCGATGGACATGCCAACTCGATTTTCACAGAGTTTTTCACAGCGGTTTCACAGCACAGCAGTGATTGTTTCACAGCAATTTTCACTTTCACAGGGGCCCTTTTCACAGCTCAGGGCTCTTTTCACTTTCACAGTTTCACAGCGCTCCTTTCACAGAGCGGGGAAATTTAAGGGAACACTCAAGGGAACAAGGGAACACACAAAGGGAACACAACACAACACATAAGGGAACACTTTCACAGAACACAAAAGTCCGAAATCATCAGCGGCGAAGGGATTTCACAGACAGACACTTTCACAGCGCATTTCACAGATACGTACTTTCACAGGCGTACTTTCACAGACTTTCACAGAGGACAAGCTCAATTTTCACAGACAGGCTGGATAAATTTCACAGCGGTAAGGGTTTCACAGCACACATAAGGGAACACGAATTTCACAGCAGGGAACACCTCTACGAGTAATCTATTACTCTACCTACTGAAGGGAACACACCGAAGACCTACTATTACCTATTACTCTTAAAGGGAACACATTACAAGGGAACACACTCTCTCGTCATATCTCACCTCTCTATTACTCTTAAGGGAACACCTTCTCGATCAACCTATTACTCTATGGAGATAGAGATATTCCAGACATATGGAGATAACATGGAGATATGGAGATAATGGAGATGGAGATAGCTCTTATATTTATCCTATGGAGATATGATACTATTAATGGAGATAATTCTAATGGAGATATAATTACTCTA"
        "AGAGGATGGGATCTCGGGCTATTACTCTAATGGAGATAAGCACTATTACTCTAGGAAATGGAGATATGTCAATGGAGATATGTAATGGAGATAGAGGGAGATGGAGTCGCCATTTCATAATCGCCATTTCATAGTTCAGGAATCGCCATTTCCGCCATTTCTAAGATGGAGTCGCCATTTCTACGTATGGAGATAGGATCGCCATTTCATACGACCCGTTGGATATCGCCATTTCCTCGCCATTTCTGGTGACATTTCTCGCCATTTCATTTCTGGAGATAGATGGATCTCGCCATTTCATAGGAATCGCCATTTCCACGTAGGGGGGGCCACAATCCGTAGGTCGGAATTCAGACTCGCCATTTCCCATCGCCATTTCTTCACCTGTATGCCGATCCCTTCGCCATTTCTCATGGAGATAACTCTCTCTCGCCATTTCTCGCCATTTCCATTTCACTCTCATTCGCCATCGCCATTTCCATTCGCCATTTCATCGCCATTTCTTCAGGATAAGATATCGCCATTTCGACTCTCATTCGCATACTGACTCTCATTCTCATCTCGCCATTTCTCATCTGACTCTCATCCTGGGGGAAACTTGCGACTCTCATCACACTTCCGTCGACTCTCATACTGGCGGATAGCATAGGAGCCATTTAAAGACTCTCATTCTCATTCGAGACTCTCATTCAAATCCTACGAGGACTCTCATATAGACTCTCATATCATTACGAGGACTCTCATATACGAGCCATGCATGTGGCGACGACTCTCATCTACGAGCCATGCAAGCAGAATCTACGAGCGACTCTCATTACGAGCCATGTGACCGTACGAGCCATGCATGCATGCCATGCTGACTCTCATCGAGTACGAGCCATGGAAGTTCTTGTTGGTTCGTAGCCCAAGAGCTGAAGTTACGAGCCTACGAGCCATGAAGTTACTTTTACGAGCCATGAAGCTTACGATACGAGCCATGCGAGCCATGCATCCGCGCTACGAGCCATGTTCCAGTACGAGCCATGTTAGTTGCTGAAGTTAAGTTTGGCGCTGAAGTTTGTACGAGCCATGTGCCCGCTGAAGTTTGTTGTACGAGCCATGCATGCTGAAGTTAATGGCTGAAGTTAGCGTTTGCGGGCAGATCCTCATTCTACGATACGAGCCATGCCATGCAGCTGAAGTTAAGTTGGGTTACGAGCCATGCGAGCCATGTGAAGTACGAGCCATGCTGGCTGAAGTTGTTTGTGCTGCTGAAGTTGCTCTTGTCTCTAGCTGAAGTTGCCAACAGGGCTGAAGCTGAAGTTTAAGCTGAAGTTGCGAGCAGGCTGAAGTTATCGGATTGGGGCTGAAGTTCAACCTCCCGTCCCCCCACACTATATTCCCGTCCCCCCCCGCGCACGCGCCGTCTCCCGTCCCCCCTATCCCGTGCGCACGCGACGCGATCCCGTCCCCCCAGAGTGCGCGCACGCGTCCCCCTTCCCGTCCCCCTCTCCCGGGCGCACGCGTCGCTCAACATTTCCGCGCACGCGTCGCGCACGCGGGCGCACGCGGGTCCCGTCCCCCCCCCTCTTCGGCGCACGCGGAATTCCCGTCGCGCACGCGTCCCGTCCCGCGCACGCGTCGCGCACGCGACTGCCCTAACCAACAGTGCGCACGCGCCGGTAACCCGGTAACCCGGTAACCGCGCACGCGGGCGCACGCGCGTAACCCGCGCACGCGCCGCGCACGCGGCCCGGTTCCCGTCCCCCCCGGTAACCCGGTAACTCCCGTCCCCCGTAACCCGGTGCGCACGCGCCCGGCGCACGCGGAGCGCACGCGCCCCCCCCGGTAATAGCGCACGCGCCCGGGCGCACGCGCCCGGTAACCCGGTAACCCGGGCGCGCGCACGCGGCGGCGCACGCGGCGCACGCGGCGCACGCG"
    )
    expected = ['AAACCAGGTGG']
    found = find_clumps(genome, 11, 566, 18)
    self.assertEqual(expected, found)