def test_clean(self):
    # clean() is fed digits interleaved with ASCII letters, punctuation and
    # accented characters; the test expects only the ten digits to remain,
    # in their original order.
    noisy = "0a1§2!3à4k5L6P7&8é9a"
    cleaned = PDFScanner(None).clean(noisy)
    self.assertEqual(cleaned, "0123456789")
def test_extract_isbn(self):
    # Runs extractISBN() against the sample PDF fixture and checks both the
    # ISBN-13 and ISBN-10 attributes the scanner exposes afterwards.
    #
    # The fixture is opened with open() inside a `with` block: the legacy
    # file() builtin does not exist on Python 3, and the context manager
    # guarantees the handle is closed even when an assertion fails.
    with open("tests/data/test_book-1.pdf", 'rb') as pdf:
        scanner = PDFScanner(pdf)
        scanner.extractISBN()
        # Attributes are read while the file is still open, in case the
        # scanner accesses the stream lazily.
        self.assertEqual(scanner.isbn13, "9783161484100")
        self.assertEqual(scanner.isbn10, "316148410X")
def test_searchCodeInPage(self):
    # Feeds the text of each fixture page to searchCodeInPage() and compares
    # the returned code with the value expected for that fixture.
    scanner = PDFScanner(None)

    def code_found_in(fixture_path):
        # Load the fixture text and return whatever code the scanner finds.
        return scanner.searchCodeInPage(read_file(fixture_path))

    # One assertion per line so a failing traceback identifies the case.
    # Test 1: the expected result is the empty string.
    self.assertEqual(code_found_in("tests/data/test_no-isbn.txt"), "")
    # Test 2
    self.assertEqual(code_found_in("tests/data/test_isbn-1.txt"), "0123456789012")
    # Test 3
    self.assertEqual(code_found_in("tests/data/test_isbn-2.txt"), "0123456789012")
    # Test 4
    self.assertEqual(code_found_in("tests/data/test_isbn-3.txt"), "9876543212346")
    # Test 5: the expected code here is ten characters long.
    self.assertEqual(code_found_in("tests/data/test_isbn-4.txt"), "0201633612")