def test_nearest_neighbors(self):
    """Check ``closest_neighbors`` against fixed expected results.

    Every entry of ``test_docs`` is parsed with ``NGramSpace(1)``, a
    ``Clustering`` is built over the parsed documents, and ``pp_distance``
    is run over the full range of document positions before any query.
    Queries are made with a one-element list (``[0]``) and a two-element
    list (``[3, 4]``) for increasing requested counts.
    """
    space = NGramSpace(1)
    parsed = [space.parse(text) for text in test_docs]
    clustering = Clustering(parsed)
    # NOTE(review): presumably prepares the distances that closest_neighbors
    # reads -- confirm against Clustering.pp_distance.
    clustering.pp_distance(range(len(test_docs)))

    # (expected result, first argument, second argument) for
    # closest_neighbors; evaluated strictly in this order.
    cases = [
        ([1], [0], 1),
        ([1, 2], [0], 2),
        ([1, 2, 3], [0], 3),
        ([1, 2, 3, 5], [0], 4),
        ([5], [3, 4], 1),
        ([5, 1], [3, 4], 2),
    ]
    for expected, members, count in cases:
        self.assertEqual(expected, clustering.closest_neighbors(members, count))