def test_second_apply_removes_previous_segments(self):
    """Apply the same filter twice to one segment storage and check the copies.

    A single ``Filter`` built from ``basic_kwargs()`` is applied two times
    against the same segment storage (a fresh document storage is requested
    for each call).  The segments stored under ``u'lemma:copy'`` must then
    equal the union of ``first_copy_lemmas()`` and ``second_copy_lemmas()``.

    NOTE(review): how that expected union relates to "removes previous
    segments" depends on the fixture helpers, which are not visible here.
    """
    storage = self.segmentstorage()
    copy_filter = Filter(**self.basic_kwargs())

    copy_filter.apply(storage, self.documentstorage())
    copy_filter.apply(storage, self.documentstorage())  # second apply

    stored_copies = set(storage.load(name=u'lemma:copy'))
    expected_copies = set(self.first_copy_lemmas()).union(
        set(self.second_copy_lemmas()))
    self.assertEqual(stored_copies, expected_copies)
def apply_filter(self, name):
    """Load the stored settings for filter ``name`` and apply that filter.

    The settings are read from ``self._setstorage`` under the encoded name,
    used as keyword arguments for ``Filter``, and the resulting filter is
    applied to ``self._segstorage`` and ``self._docstorage``.

    Args:
        name: name of the stored filter settings; passed through
            ``encode_name`` before the lookup.

    Returns:
        A JSON string ``{"result": "FAIL", "error": <message>}`` when any
        exception is raised while loading, building or applying the filter.
        NOTE(review): the visible code has no explicit return on success, so
        the method falls through and returns ``None`` in that case -- confirm
        whether callers expect a success payload.
    """
    try:
        settings = self._setstorage.load(encode_name(name))
        filt = Filter(**settings)
        filt.apply(self._segstorage, self._docstorage)
    # ``except ... as`` is valid on Python 2.6+ and Python 3, unlike the
    # comma form, which is a SyntaxError on Python 3.
    except Exception as e:
        # Boundary handler: every failure is reported to the caller as JSON
        # instead of propagating.
        return json.dumps({"result": "FAIL", "error": str(e)})
def test_basic_creation(self):
    """Check that a segment-creating filter stores the expected lemmas.

    Starts from ``basic_kwargs()``, overrides the value regex, the negative
    regex, the output name (``u'lemma'``) and sets ``CREATES_SEGMENT`` to
    ``True``.  The filter is applied to a fresh ``SegmentStorage`` and the
    segments loaded under ``u'lemma'`` must equal ``lemma3()`` and
    ``lemma7()``.
    """
    kwargs = self.basic_kwargs()
    # The backslash is doubled so the literal no longer relies on the
    # unknown escape ``\d`` being passed through (deprecated on Python 3.6+);
    # the runtime pattern is unchanged.
    kwargs[SEGMENT_VALUE_REGEX] = u'was|sick|\\d+'
    kwargs[SEGMENT_NEG_REGEX] = u'was'
    kwargs[OUTPUT_NAME] = u'lemma'
    kwargs[CREATES_SEGMENT] = True

    segmentstorage = SegmentStorage()
    filt = Filter(**kwargs)
    filt.apply(segmentstorage, self.documentstorage())

    segs = segmentstorage.load(name=u'lemma')
    self.assertEqual(set(segs), set([self.lemma3(), self.lemma7()]))