def test_boilerpipe_extractor_str(self):
    """Check that CharCount yields 23 for the ``self.d4`` fixture.

    ``self.d4`` is wrapped in a one-element list, passed through
    ``CharCount().process``, and the first produced item is compared
    directly against 23.
    """
    # NOTE(review): the method name refers to a boilerpipe extractor, but the
    # body exercises CharCount -- the name looks like a copy-paste leftover.
    # presumably self.d4 is a plain string fixture (per the "_str" suffix);
    # confirm against setUp.
    counter = CharCount()
    results = list(counter.process([self.d4]))
    first_result = results[0]
    self.assertEqual(first_result, 23)
def test_boilerpipe_extractor_without_attribute(self):
    """Check the ``char_count`` values CharCount produces for ``self.docs``.

    ``self.docs`` is passed through ``CharCount().process`` and the
    ``document["char_count"]`` entry of the first three results is
    expected to be 10, 30 and 23, in that order.
    """
    # NOTE(review): the method name refers to a boilerpipe extractor, but the
    # body exercises CharCount -- the name looks like a copy-paste leftover.
    # presumably "without_attribute" means CharCount is built with its
    # default arguments; confirm against the CharCount constructor.
    counter = CharCount()
    processed = list(counter.process(self.docs))
    expected_counts = (10, 30, 23)
    # Index explicitly (rather than zip) so a short result list still fails
    # with IndexError instead of silently skipping expectations.
    for position, expected in enumerate(expected_counts):
        self.assertEqual(processed[position].document["char_count"], expected)