def test_async(self):
    """Check the PDF conversion result against the jpg listing of ./images.

    Builds "<dir>/<name>" paths for every entry ``analyser.get_payslips``
    reports for ``./resources`` with the ``'pdf'`` argument, passes them to
    ``analyser.asynchronously_convert_pdfs`` together with ``"./images"``
    (presumably the output directory -- confirm against ``analyser``), and
    asserts that the returned list equals, ignoring order, what
    ``analyser.get_payslips('./images', 'jpg', True)`` reports afterwards.
    """
    source_dir = './resources'
    pdf_names = analyser.get_payslips(source_dir, 'pdf')
    pdf_paths = ["{}/{}".format(source_dir, name) for name in pdf_names]

    converted = analyser.asynchronously_convert_pdfs(pdf_paths, "./images")

    # Both sides are sorted so the comparison does not depend on ordering.
    actual = sorted(converted)
    expected = sorted(analyser.get_payslips('./images', 'jpg', True))
    self.assertListEqual(actual, expected)
def test_tesseract(self):
    """Smoke-run the convert-then-tesseract sequence on the ./images entries.

    Calls ``analyser.asynchronously_convert_pdfs`` on "<dir>/<name>" paths
    built from ``analyser.get_payslips('./images', 'jpg')``, feeds the
    result to ``analyser.asynchronously_tesseract_images`` and prints what
    that returns.

    NOTE(review): the only live assertion compares "a" with "a", so this
    test can fail only if one of the ``analyser`` calls raises.
    """
    image_dir = './images'
    jpg_names = analyser.get_payslips(image_dir, 'jpg')
    jpg_paths = ["{}/{}".format(image_dir, name) for name in jpg_names]

    # NOTE(review): these are 'jpg' entries from ./images, yet they are
    # handed to the PDF converter -- confirm this is intended and not a
    # copy-paste slip.
    converted = analyser.asynchronously_convert_pdfs(jpg_paths, "./images")

    # Listing taken before the tesseract step; its value is never read.
    listing_before = analyser.get_payslips('./images', 'jpg', True)

    tesseract_result = analyser.asynchronously_tesseract_images(converted)

    # Listing taken after the tesseract step; its value is never read either.
    listing_after = analyser.get_payslips('./images', 'jpg', True)

    print(tesseract_result)

    # NOTE(review): a list-equality check of the sorted tesseract result
    # against the sorted post-run listing was disabled here; only the
    # placeholder assertion below remains. Restore a real check once the
    # expected return value is known.
    self.assertEqual("a", "a")
def test_tesseract(self):
    """Run PDF conversion followed by the tesseract step and print the result.

    The input paths are "<dir>/<name>" strings for each entry returned by
    ``analyser.get_payslips('./images', 'jpg')``. They go through
    ``analyser.asynchronously_convert_pdfs`` (second argument
    ``"./images"``) and the outcome is passed on to
    ``analyser.asynchronously_tesseract_images``.

    NOTE(review): nothing about the result is verified -- the single
    assertion is ``"a" == "a"`` -- so the test passes whenever no call
    raises.
    """
    images_dir = './images'
    entries = analyser.get_payslips(images_dir, 'jpg')
    entry_paths = ["{}/{}".format(images_dir, entry) for entry in entries]

    # NOTE(review): 'jpg' entries are being passed to the PDF converter;
    # verify that this input is what the test is meant to exercise.
    conversion_result = analyser.asynchronously_convert_pdfs(
        entry_paths, "./images")

    # Unused snapshot of the jpg listing before the tesseract call.
    jpgs_before = analyser.get_payslips('./images', 'jpg', True)

    tesseract_output = analyser.asynchronously_tesseract_images(
        conversion_result)

    # Unused snapshot of the jpg listing after the tesseract call.
    jpgs_after = analyser.get_payslips('./images', 'jpg', True)

    print(tesseract_output)

    # NOTE(review): the original comparison (sorted result vs. sorted
    # post-run jpg listing) is disabled; the assertion below is a
    # placeholder that always passes.
    self.assertEqual("a", "a")
def test_async(self):
    """Verify that converting the ./resources PDFs yields the ./images jpgs.

    Every entry from ``analyser.get_payslips('./resources', 'pdf')`` is
    turned into a "<dir>/<name>" path and passed, with ``"./images"`` as
    the second argument, to ``analyser.asynchronously_convert_pdfs``. The
    returned list must equal the list from
    ``analyser.get_payslips('./images', 'jpg', True)`` once both are
    sorted.
    """
    resources_dir = './resources'
    payslip_names = analyser.get_payslips(resources_dir, 'pdf')
    payslip_paths = [
        "{}/{}".format(resources_dir, payslip) for payslip in payslip_names
    ]

    produced = analyser.asynchronously_convert_pdfs(payslip_paths, "./images")

    # Sort first so list order cannot cause a spurious mismatch.
    produced_sorted = sorted(produced)
    on_disk_sorted = sorted(analyser.get_payslips('./images', 'jpg', True))
    self.assertListEqual(produced_sorted, on_disk_sorted)