def iter_links_domain(record):
    """Turn a link row into a pair of domain IDs.

    Transforms Row(d1="x.com", d2="y.com") into a one-element list holding
    the tuple (ID of d1, ID of d2), with each ID passed through ``py2_long``.

    An empty list is returned instead when:
      * either ``d1`` or ``d2`` is missing/empty (falsy),
      * computing either ID raises an exception,
      * both domains resolve to the same ID.
    """
    source, target = record["d1"], record["d2"]
    if not (source and target):
        return []

    try:
        source_id = _fast_make_domain_id(source)
        target_id = _fast_make_domain_id(target)
    except Exception:  # pylint: disable=broad-except
        # Best effort: a row whose IDs cannot be computed yields nothing.
        return []

    # Rows whose two ends share the same ID are dropped.
    return (
        []
        if source_id == target_id
        else [(py2_long(source_id), py2_long(target_id))]
    )
def iter_domain(record):
    """Turn a domain row into an (ID, normalized name) pair.

    Transforms Row(domain=www.example.com) into a one-element list holding
    the tuple ([int64 ID], "example.com"): the ID is computed from the
    ``normalized_domain`` of ``URL("http://" + domain)`` and passed through
    ``py2_long``; the name is that normalized domain as a ``str``.

    An empty list is returned when the domain is missing, empty or
    whitespace-only, or when computing the ID raises an exception.
    """
    raw_domain = record["domain"]
    if not (raw_domain and raw_domain.strip()):
        return []

    # NOTE(review): only the ID computation below is guarded; an exception
    # raised while building the URL propagates to the caller. The domain is
    # also used unstripped here - confirm both are intended.
    normalized = URL("http://" + raw_domain).normalized_domain

    try:
        domain_id = _fast_make_domain_id(normalized)
    except Exception:  # pylint: disable=broad-except
        # Best effort: a domain whose ID cannot be computed yields nothing.
        return []

    return [(py2_long(domain_id), str(normalized))]