def test_names_and_tags(self):
    """Check the per-item results of ``es.check_names_and_tags``.

    The call returns a pair ``(names, tags)`` with one result per input
    item. The assertions pin the three kinds of result seen here:
    ``False``, ``True``, or (for names) a replacement string.
    NOTE(review): presumably ``False`` means "unknown", ``True`` means
    "exact match" and a string is a suggested spelling -- confirm
    against ``es``.
    """
    names, tags = es.check_names_and_tags(
        [u"ебь гсей", u"еленна скрыник", u"елена скрынник"],
        [u"лобби", u"браат", u"двоюр"])

    # ``assertEqual`` is used instead of the deprecated ``assertEquals``
    # alias, which newer unittest versions no longer provide.
    self.assertEqual(len(names), 3)
    self.assertEqual(names[0], False)
    # The misspelled second name yields the spelling of the third one.
    self.assertEqual(names[1], u"елена скрынник")
    self.assertEqual(names[2], True)

    self.assertEqual(len(tags), 3)
    self.assertEqual(tags[0], True)
    self.assertEqual(tags[1], False)
    self.assertEqual(tags[2], False)
def test_names_and_tags(self):
    """Check the per-item results of ``es.check_names_and_tags``.

    The call returns a pair ``(names, tags)`` with one result per input
    item. The assertions pin the three kinds of result seen here:
    ``False``, ``True``, or (for names) a replacement string.
    NOTE(review): presumably ``False`` means "unknown", ``True`` means
    "exact match" and a string is a suggested spelling -- confirm
    against ``es``.
    """
    names, tags = es.check_names_and_tags(
        [u"ебь гсей", u"еленна скрыник", u"елена скрынник"],
        [u"лобби", u"браат", u"двоюр"])

    # ``assertEqual`` is used instead of the deprecated ``assertEquals``
    # alias, which newer unittest versions no longer provide.
    self.assertEqual(len(names), 3)
    self.assertEqual(names[0], False)
    # The misspelled second name yields the spelling of the third one.
    self.assertEqual(names[1], u"елена скрынник")
    self.assertEqual(names[2], True)

    self.assertEqual(len(tags), 3)
    self.assertEqual(tags[0], True)
    self.assertEqual(tags[1], False)
    self.assertEqual(tags[2], False)
def check_names_tags(bucks):
    """Report suspicious names and unknown tags found in ``bucks``.

    Every distinct name and tag is checked once through
    ``es.check_names_and_tags``; the results are then mapped back onto
    the individual records.

    Args:
        bucks: sequence of records indexed as
            ``(name_1, name_2, link_types)``, where ``link_types`` is an
            iterable of tag strings.

    Returns:
        A list of ``(index, message)`` tuples in record order, where
        ``index`` is the position of the record in ``bucks``. A message
        is ``STR_SIMILAR_NAME:<name>,<result>`` when the check returned a
        string for a name, or ``STR_TAG_NOT_FOUND:<tag>,<tag>...`` when
        the check returned ``False`` for one or more of the record's
        tags.
    """
    # Snapshot the distinct values into lists so the sequence handed to
    # ``es`` and the one zipped with its results share one explicit order.
    names = list({name for buck in bucks for name in (buck[0], buck[1])})
    tags = list({tag for buck in bucks for tag in buck[2]})

    name_results, tag_results = es.check_names_and_tags(names, tags)
    names_n = dict(zip(names, name_results))
    tags_n = dict(zip(tags, tag_results))

    res = []
    for idx, buck in enumerate(bucks):
        for name in (buck[0], buck[1]):
            similar = names_n[name]
            # A string result is reported; boolean results are ignored.
            if isinstance(similar, basestring):
                res.append(
                    (idx, u"STR_SIMILAR_NAME:{},{}".format(name, similar)))

        # Compare against False explicitly (not by truthiness) to keep
        # the original matching semantics for non-boolean results.
        false_tags = [
            tag for tag in buck[2] if tags_n[tag] == False]  # noqa: E712
        if false_tags:
            res.append(
                (idx, u"STR_TAG_NOT_FOUND:{}".format(",".join(false_tags))))
    return res
def check_names_tags(bucks):
    """Report suspicious names and unknown tags found in ``bucks``.

    Every distinct name and tag is checked once through
    ``es.check_names_and_tags``; the results are then mapped back onto
    the individual records.

    Args:
        bucks: sequence of records indexed as
            ``(name_1, name_2, link_types)``, where ``link_types`` is an
            iterable of tag strings.

    Returns:
        A list of ``(index, message)`` tuples in record order, where
        ``index`` is the position of the record in ``bucks``. A message
        is ``STR_SIMILAR_NAME:<name>,<result>`` when the check returned a
        string for a name, or ``STR_TAG_NOT_FOUND:<tag>,<tag>...`` when
        the check returned ``False`` for one or more of the record's
        tags.
    """
    # Snapshot the distinct values into lists so the sequence handed to
    # ``es`` and the one zipped with its results share one explicit order.
    names = list({name for buck in bucks for name in (buck[0], buck[1])})
    tags = list({tag for buck in bucks for tag in buck[2]})

    name_results, tag_results = es.check_names_and_tags(names, tags)
    names_n = dict(zip(names, name_results))
    tags_n = dict(zip(tags, tag_results))

    res = []
    for idx, buck in enumerate(bucks):
        for name in (buck[0], buck[1]):
            similar = names_n[name]
            # A string result is reported; boolean results are ignored.
            if isinstance(similar, basestring):
                res.append(
                    (idx, u"STR_SIMILAR_NAME:{},{}".format(name, similar)))

        # Compare against False explicitly (not by truthiness) to keep
        # the original matching semantics for non-boolean results.
        false_tags = [
            tag for tag in buck[2] if tags_n[tag] == False]  # noqa: E712
        if false_tags:
            res.append(
                (idx, u"STR_TAG_NOT_FOUND:{}".format(",".join(false_tags))))
    return res
def __init__(self, names, tags):
    """Check ``names`` and ``tags`` once and store the results by item.

    Calls ``es.check_names_and_tags(names, tags)`` and pairs each input
    item with the result at the same position.

    Args:
        names: names to check; become the keys of ``self.names``.
        tags: tags to check; become the keys of ``self.tags``.
    """
    name_results, tag_results = es.check_names_and_tags(names, tags)
    self.names = {
        name: result for name, result in zip(names, name_results)}
    self.tags = {
        tag: result for tag, result in zip(tags, tag_results)}