Esempio n. 1
0
 def _clean_html(self, html):
     """Return a normalized copy of the retrieved HTML.

     Every match of the module-level ``re_spaces`` pattern is replaced by
     a single space, and the result is handed to ``subXMLRefs``, whose
     return value is returned unchanged.

     NOTE(review): ``re_spaces`` presumably matches runs of whitespace and
     ``subXMLRefs`` presumably rewrites character/entity references; both
     are defined outside this method -- confirm against their definitions.
     """
     return subXMLRefs(re_spaces.sub(' ', html))
Esempio n. 2
0
 def _clean_html(self, html):
     """Return a normalized copy of the retrieved HTML.

     Three steps are applied in order: matches of the module-level
     ``re_spaces`` pattern become a single space, every occurrence of the
     two-character marker ending in ``»`` is deleted, and the result is
     passed through ``subXMLRefs``.

     NOTE(review): ``re_spaces`` presumably matches runs of whitespace and
     ``subXMLRefs`` presumably rewrites character/entity references; both
     are defined outside this method -- confirm against their definitions.
     """
     collapsed = re_spaces.sub(' ', html)
     # The marker is purely decorative; drop it before reference handling.
     without_marker = collapsed.replace(' »', '')
     return subXMLRefs(without_marker)
Esempio n. 3
0
 def _clean_html(self, html):
     """Return a normalized copy of the retrieved HTML.

     Matches of the module-level ``re_spaces`` pattern are replaced by a
     single space before the text is passed to ``subXMLRefs``; whatever
     that helper returns is the result.

     NOTE(review): ``re_spaces`` presumably matches runs of whitespace and
     ``subXMLRefs`` presumably rewrites character/entity references; both
     are defined outside this method -- confirm against their definitions.
     """
     single_spaced = re_spaces.sub(' ', html)
     return subXMLRefs(single_spaced)