示例#1
0
    def test_parse_text(self):
        """Check the image attributes parsed from two fake-server pages.

        Every image yielded by ``Page.images()`` for ``image1.html`` is
        compared against values derived from its position in the page,
        except images whose label is ``'y'``, which are skipped.  The first
        two ``<img>`` elements of ``bad_image.html`` are then converted with
        ``HTMLImage.from_element`` and their dimensions are checked.
        """
        from string import ascii_letters

        p = Page(config.fake_server('image1.html'))
        for i, image in enumerate(p.images()):
            # The label is the fifth character of ``image.src.leaf()``
            # (presumably the file-name part of the URL -- confirm).
            label = image.src.leaf()[4]

            if label == 'y':
                # Images labelled 'y' are exempt from the positional checks.
                continue

            # The i-th image is expected to carry the i-th ASCII letter and
            # dimensions that scale with its 1-based position.
            self.assertEqual(label, ascii_letters[i])
            self.assertEqual((i + 1) * 10, image.width)
            self.assertEqual((i + 1) * 20, image.height)
            self.assertEqual(label, image.title[-1])
            self.assertEqual(label, image.alt[-1])

        p = Page(config.fake_server('bad_image.html'))
        bads = list(p._get_tree().xpath('//img'))

        # The first element is expected to yield concrete dimensions.
        sized_img = HTMLImage.from_element(bads[0])
        self.assertEqual(sized_img.width, 11)
        self.assertEqual(sized_img.height, 12)

        # The second element is expected to yield no dimensions at all.
        # assertIsNone reports the offending value when the check fails.
        unsized_img = HTMLImage.from_element(bads[1])
        self.assertIsNone(unsized_img.width)
        self.assertIsNone(unsized_img.height)
示例#2
0
    def test_parse_text(self):
        """Check the image attributes parsed from two fake-server pages.

        Every image yielded by ``Page.images()`` for ``image1.html`` is
        compared against values derived from its position in the page,
        except images whose label is ``"y"``, which are skipped.  The first
        two ``<img>`` elements of ``bad_image.html`` are then converted with
        ``HTMLImage.from_element`` and their dimensions are checked.
        """
        from string import ascii_letters

        p = Page(config.fake_server("image1.html"))
        for i, image in enumerate(p.images()):
            # The label is the fifth character of ``image.src.leaf()``
            # (presumably the file-name part of the URL -- confirm).
            label = image.src.leaf()[4]

            if label == "y":
                # Images labelled "y" are exempt from the positional checks.
                continue

            # The i-th image is expected to carry the i-th ASCII letter and
            # dimensions that scale with its 1-based position.
            self.assertEqual(label, ascii_letters[i])
            self.assertEqual((i + 1) * 10, image.width)
            self.assertEqual((i + 1) * 20, image.height)
            self.assertEqual(label, image.title[-1])
            self.assertEqual(label, image.alt[-1])

        p = Page(config.fake_server("bad_image.html"))
        bads = list(p._get_tree().xpath("//img"))

        # The first element is expected to yield concrete dimensions.
        sized_img = HTMLImage.from_element(bads[0])
        self.assertEqual(sized_img.width, 11)
        self.assertEqual(sized_img.height, 12)

        # The second element is expected to yield no dimensions at all.
        # assertIsNone reports the offending value when the check fails.
        unsized_img = HTMLImage.from_element(bads[1])
        self.assertIsNone(unsized_img.width)
        self.assertIsNone(unsized_img.height)
示例#3
0
 def xxx_test_extract_text(self):
     """Check that ``Image.text()`` reads 'Hello World!' from the OCR image.

     NOTE(review): the ``xxx_`` prefix keeps the default unittest loader
     (which collects ``test*`` methods) from running this; presumably it
     was disabled on purpose -- confirm before renaming.
     """
     # XXX
     i = Image(config.fake_server('images/test_ocr.jpg'))
     # Trailing whitespace in the extracted text is ignored.
     # assertEqual replaces the deprecated assertEquals alias, which was
     # removed in Python 3.12.
     self.assertEqual(i.text().rstrip(), 'Hello World!')
示例#4
0
 def test_entropy(self):
     """Check ``Image.entropy()`` against recorded values for two images.

     Both images are created inside the ``config.fake_proxy()`` context.
     """
     with config.fake_proxy():
         # assertAlmostEqual replaces the deprecated assertAlmostEquals
         # alias (removed in Python 3.12); by default it compares the two
         # values rounded to 7 decimal places.
         i = Image('http://www.cs.unc.edu/~karl/me.jpg')
         self.assertAlmostEqual(i.entropy(), 8.67911685935)
         i = Image(config.fake_server('images/test_ocr.jpg'))
         self.assertAlmostEqual(i.entropy(), 5.2323108617)
示例#5
0
 def test_entropy(self):
     """Check ``Image.entropy()`` against the recorded value for the OCR image."""
     i = Image(config.fake_server('images/test_ocr.jpg'))
     # assertAlmostEqual replaces the deprecated assertAlmostEquals alias
     # (removed in Python 3.12); by default it compares the two values
     # rounded to 7 decimal places.
     self.assertAlmostEqual(i.entropy(), 5.2323108617)
示例#6
0
 def xxx_test_extract_text(self):
     """Check that ``Image.text()`` reads "Hello World!" from the OCR image.

     NOTE(review): the ``xxx_`` prefix keeps the default unittest loader
     (which collects ``test*`` methods) from running this; presumably it
     was disabled on purpose -- confirm before renaming.
     """
     # XXX
     i = Image(config.fake_server("images/test_ocr.jpg"))
     # Trailing whitespace in the extracted text is ignored.
     # assertEqual replaces the deprecated assertEquals alias, which was
     # removed in Python 3.12.
     self.assertEqual(i.text().rstrip(), "Hello World!")
示例#7
0
 def test_entropy(self):
     """Check ``Image.entropy()`` against recorded values for two images.

     Both images are created inside the ``config.fake_proxy()`` context.
     """
     with config.fake_proxy():
         # assertAlmostEqual replaces the deprecated assertAlmostEquals
         # alias (removed in Python 3.12); by default it compares the two
         # values rounded to 7 decimal places.
         i = Image("http://www.cs.unc.edu/~karl/me.jpg")
         self.assertAlmostEqual(i.entropy(), 8.67911685935)
         i = Image(config.fake_server("images/test_ocr.jpg"))
         self.assertAlmostEqual(i.entropy(), 5.2323108617)
示例#8
0
 def test_entropy(self):
     """Check ``Image.entropy()`` against the recorded value for the OCR image."""
     i = Image(config.fake_server("images/test_ocr.jpg"))
     # assertAlmostEqual replaces the deprecated assertAlmostEquals alias
     # (removed in Python 3.12); by default it compares the two values
     # rounded to 7 decimal places.
     self.assertAlmostEqual(i.entropy(), 5.2323108617)