Beispiel #1
0
    def GetParsedData(self):
        """Read the response body and run it through a new MyHtmlParser.

        The ``charset`` parameter is looked up on the response headers; when
        it is present (truthy) the body is decoded with it, otherwise the
        body is handed to the parser exactly as read.

        Returns:
            The MyHtmlParser instance after the body has been fed to it.
        """
        charset = self.req_response.headers.getparam("charset")

        # Read once, then decode only if the headers declared a charset.
        body = self.req_response.read()
        if charset:
            body = body.decode(charset)

        html_parser = MyHtmlParser()
        html_parser.feed(body)
        return html_parser
class TestParser(unittest.TestCase):
  """Checks which MyHtmlParser attribute each kind of tag URL lands in."""

  def setUp(self):
    # unittest calls setUp before every test, so each test gets its own parser.
    self.parser = MyHtmlParser()

  def test_finds_css_links(self):
    # A stylesheet <link> href is expected in the parser's `css` list.
    markup = '<link rel="stylesheet" href="/style.css" />'
    self.parser.feed(markup)
    self.assertEqual(self.parser.css, ['/style.css'])

  def test_finds_js_script_links(self):
    # A <script> src is expected in the parser's `scripts` list.
    markup = '<script src="/launch.js" />'
    self.parser.feed(markup)
    self.assertEqual(self.parser.scripts, ['/launch.js'])

  def test_finds_url_links(self):
    # An <a> href is expected in the parser's `links` list.
    markup = '<a href="http://www.google.com/" />'
    self.parser.feed(markup)
    self.assertEqual(self.parser.links, ['http://www.google.com/'])

  def test_finds_embedded_images(self):
    # An <img> src is expected in the parser's `images` list.
    markup = '<img src="/icon.jpeg" />'
    self.parser.feed(markup)
    self.assertEqual(self.parser.images, ['/icon.jpeg'])