Ejemplo n.º 1
0
def extract_links_to_embedded_content(main_content):
    """Collect tagged URLs for the embedded items found in *main_content*.

    Every ``<div class="embedContents">`` under *main_content* is handed to
    ``ipm_utils.extract_tagged_url_from_embedded_item`` together with
    ``DHNET_NETLOC`` and ``DHNET_INTERNAL_SITES``. Results that are ``None``
    are dropped; everything else is returned in document order.

    :param main_content: a parsed node exposing ``findAll`` (presumably a
        BeautifulSoup tag -- confirm against the caller).
    :return: list of the non-``None`` values returned by the helper.
    """
    embed_divs = main_content.findAll("div", {"class": "embedContents"})
    # Lazy generator: the helper is still invoked once per div, in order.
    candidates = (
        ipm_utils.extract_tagged_url_from_embedded_item(div, DHNET_NETLOC, DHNET_INTERNAL_SITES)
        for div in embed_divs
    )
    # Only None is filtered out; other falsy results are kept on purpose.
    return [tagged for tagged in candidates if tagged is not None]
Ejemplo n.º 2
0
def extract_embedded_content_links(main_content):
    """Collect tagged URLs for the embedded items found in *main_content*.

    Every ``<div class="embedContents">`` under *main_content* is handed to
    ``ipm_utils.extract_tagged_url_from_embedded_item`` together with
    ``LALIBRE_NETLOC`` and ``LALIBRE_ASSOCIATED_SITES``. Falsy results are
    dropped; the remaining ones are returned in document order.

    :param main_content: a parsed node exposing ``findAll`` (presumably a
        BeautifulSoup tag -- confirm against the caller).
    :return: list of the truthy values returned by the helper.
    """
    embed_divs = main_content.findAll('div', {'class': 'embedContents'})
    tagged_urls = []
    for embed_div in embed_divs:
        tagged_url = ipm_utils.extract_tagged_url_from_embedded_item(
            embed_div, LALIBRE_NETLOC, LALIBRE_ASSOCIATED_SITES)
        # Truthiness test (not ``is not None``): any falsy result is skipped.
        if tagged_url:
            tagged_urls.append(tagged_url)
    return tagged_urls