def Reduce_Nmers(Info): print 'COMPUTING Nmers ....' mseqs = ReduceInfo2seqs(Info,70, lambda L: MotifTools.top_nmers(6,L)[0:3]) print "Combining representative sequences...: " for i in range(len(mseqs)): i = i + 1 print '\t%s'%mseqs[i-1], if (i%5 == 0): print print top_seq_pairs = MotifTools.top_nmers(5,mseqs,1) total_nmers = 0 for (mner,count) in top_seq_pairs: total_nmers = total_nmers + count for (nmer,count) in top_seq_pairs[0:8]: print "RESULT: %s\t%2d (%5.2f%%) occurences: "%(nmer,count, 100*float(count)/total_nmers), for bsite in Info.query['bsites']: seq = bsite.cleantxt() (max,s1,s2) = MotifTools.compare_seqs(nmer,seq) print ' %s vs %s %4.2f correct'%(s1,s2,max)