def feed(self, entity):
    """Analyze the text values of ``entity`` and collect extracted tags.

    Returns without doing anything when ``settings.ANALYZE_ENTITIES`` is
    falsy, when the entity's schema is not ``ANALYZABLE``, or when the
    entity is a ``Table``. Otherwise every chunk of the entity's text
    values is passed to language detection, entity extraction and pattern
    extraction. Extracted entity tags go to ``self.aggregator_entities``
    and pattern tags go to ``self.aggregator_patterns``.

    Note that the text is read from the ``entity`` argument, while the
    detection/extraction helpers are called with ``self.entity``.
    """
    # HACK: Tables should be mapped, don't try to tag them here.
    # The checks short-circuit in the order: global switch, analyzable
    # schema, table exclusion.
    skip = (
        not settings.ANALYZE_ENTITIES
        or not entity.schema.is_a(ANALYZABLE)
        or entity.schema.is_a("Table")
    )
    if skip:
        return

    values = entity.get_type_values(registry.text)
    for chunk in text_chunks(values):
        subject = self.entity
        detect_languages(subject, chunk)
        for name, value in extract_entities(subject, chunk):
            self.aggregator_entities.add(name, value)
        for name, value in extract_patterns(subject, chunk):
            self.aggregator_patterns.add(name, value)
def feed(self, entity):
    """Analyze the text values of ``entity`` and collect extracted tags.

    Returns without doing anything when ``settings.ANALYZE_ENTITIES`` is
    falsy, when the entity's schema is not a ``Document``, or when the
    entity is a ``Table``. Otherwise every chunk of the entity's text
    values is passed to language detection, entity extraction and pattern
    extraction, and all resulting tags are added to ``self.aggregator``.

    Note that the text is read from the ``entity`` argument, while the
    detection/extraction helpers are called with ``self.entity``.
    """
    # TODO: should we have a schema called "Taggable" with
    # the XXmentioned properties?
    # HACK: Tables will be mapped, don't try to tag them here.
    # The checks short-circuit in the order: global switch, document
    # schema, table exclusion.
    skip = (
        not settings.ANALYZE_ENTITIES
        or not entity.schema.is_a('Document')
        or entity.schema.is_a('Table')
    )
    if skip:
        return

    values = entity.get_type_values(registry.text)
    for chunk in text_chunks(values):
        subject = self.entity
        detect_languages(subject, chunk)
        for name, value in extract_entities(subject, chunk):
            self.aggregator.add(name, value)
        for name, value in extract_patterns(subject, chunk):
            self.aggregator.add(name, value)