def _clean_html(self, html):
    """Normalize the retrieved HTML before it is parsed.

    Every match of the module-level ``re_spaces`` pattern is replaced by
    a single space, and the result is passed through ``subXMLRefs``,
    whose return value is handed back to the caller.
    """
    return subXMLRefs(re_spaces.sub(' ', html))
def _clean_html(self, html):
    """Normalize the retrieved HTML before it is parsed.

    Three steps are applied in order: every match of the module-level
    ``re_spaces`` pattern becomes a single space, the '»' markers
    (together with the character preceding them) are removed, and the
    result is passed through ``subXMLRefs``.
    """
    spaced = re_spaces.sub(' ', html)
    # Strip the decorative '»' markers; this must run after the space
    # substitution and before subXMLRefs, as in the original ordering.
    without_markers = spaced.replace(' »', '')
    return subXMLRefs(without_markers)