Exemple #1
0
def cleanHtml(content):
    """Parse ``content`` as HTML, run the clean-up helpers, return unicode.

    ``content`` is handed to ``BeautifulSoup``; the resulting tree is then
    passed through a fixed sequence of helper functions.  Each helper
    receives the current tree and whatever it returns becomes the input of
    the next helper.  The final tree is converted with ``unicode()`` and
    returned.

    NOTE(review): the helpers are defined outside this function, so their
    exact effect is only implied by their names -- confirm against their
    definitions before relying on any particular clean-up guarantee.
    """
    tree = BeautifulSoup(content)

    # Order is significant: every step operates on the previous step's result.
    pipeline = (
        removeJavascript,
        replaceEmbedsWithIframes,
        removeViewFromImages,
        removeStylesFromInlineImages,
        removeWidthHeightFromInlineImages,
    )
    for step in pipeline:
        tree = step(tree)

    return unicode(tree)