def testMultiLen(self):
    """Check the shingle sets expected from ``Shingler(2, 3)``.

    For "abcdef" the expected set holds every tuple of 2 and of 3
    consecutive characters.  For inputs shorter than a shingle length
    ("ab", "a") the expected tuples are left-padded with ``None``.
    Results are compared as sets, so emission order is not checked.
    """
    shingler = Shingler(2, 3)

    produced = set(shingler.shingle("abcdef"))
    expected = {
        tuple(chunk)
        for chunk in ("ab", "bc", "cd", "de", "ef", "abc", "bcd", "cde", "def")
    }
    self.assertSetEqual(expected, produced)

    # Input exactly as long as the larger shingle length: no padding expected.
    expected_abc = {("a", "b"), ("b", "c"), ("a", "b", "c")}
    self.assertSetEqual(expected_abc, set(shingler.shingle("abc")))

    # Input shorter than the larger length: the 3-tuple is None-padded.
    expected_ab = {("a", "b"), (None, "a", "b")}
    self.assertSetEqual(expected_ab, set(shingler.shingle("ab")))

    # Input shorter than both lengths: both tuples are None-padded.
    expected_a = {(None, "a"), (None, None, "a")}
    self.assertSetEqual(expected_a, set(shingler.shingle("a")))
def testLenTwo(self):
    """Check the ordered shingles expected from ``Shingler(2)``.

    For "abcdef" the expected result is the list of 2-tuples of
    consecutive characters, in input order.  A one-character input is
    expected to yield a single tuple left-padded with ``None``.
    """
    s = Shingler(2)
    shingles = list(s.shingle("abcdef"))

    # Build a real list: on Python 3 ``map`` returns a lazy iterator, which
    # assertListEqual rejects ("First sequence is not a list").
    expected = [tuple(pair) for pair in ["ab", "bc", "cd", "de", "ef"]]
    self.assertListEqual(expected, shingles)

    self.assertListEqual([(None, 'a',)], list(s.shingle("a")))
    self.assertListEqual([('a', 'b',)], list(s.shingle("ab")))
def testLenOne(self):
    """Check the ordered shingles expected from ``Shingler(1)``.

    Each character of the input is expected to come back as its own
    1-tuple, in input order.
    """
    s = Shingler(1)
    shingles = list(s.shingle("abcdef"))

    # Build a real list: on Python 3 ``map`` returns a lazy iterator, which
    # assertListEqual rejects ("First sequence is not a list").
    expected = [tuple(char) for char in "abcdef"]
    self.assertListEqual(expected, shingles)

    self.assertListEqual([('a',)], list(s.shingle("a")))