def testScannedPdfPage(self):
    """Extracting page 2 of the scanned sample PDF must create ``2.txt``.

    The test passes when a regular file named ``2.txt`` exists in
    ``self.outdir`` after ``extractPage(2)`` has run.
    """
    # NOTE(review): the meaning of the second constructor argument (5) is
    # not visible from this test -- confirm against PdfToText.
    pdfToText = PdfToText('tests/sample-scanned.pdf', 5, self.outdir)
    pdfToText.extractPage(2)

    expected_path = os.path.join(self.outdir, "2.txt")
    self.assertTrue(
        os.path.isfile(expected_path),
        "expected output file was not created: %s" % expected_path,
    )
def testStructuredPdfPage(self):
    """Extracting page 1 of the sample PDF must create ``1.txt``.

    The test passes when a regular file named ``1.txt`` exists in
    ``self.outdir`` after ``extractPage(1)`` has run.
    """
    # NOTE(review): the meaning of the second constructor argument (5) is
    # not visible from this test -- confirm against PdfToText.
    pdfToText = PdfToText('tests/sample.pdf', 5, self.outdir)
    pdfToText.extractPage(1)

    expected_path = os.path.join(self.outdir, "1.txt")
    self.assertTrue(
        os.path.isfile(expected_path),
        "expected output file was not created: %s" % expected_path,
    )