def assertDocumentPagesTransformCorrect(self, transformed_pages, raw_pages, **kwargs): for page, expected_page in zip(transformed_pages, raw_pages): assert page.page_number == expected_page.page_number assert page.angle == adjust_text_angle(expected_page.angle) assert page.width == expected_page.width assert page.height == expected_page.height assert page.unit == expected_page.unit for line, expected_line in zip(page.lines or [], expected_page.lines or []): self.assertDocumentLineTransformCorrect(line, expected_line) for word, expected_word in zip(page.words or [], expected_page.words or []): self.assertDocumentWordTransformCorrect(word, expected_word) for selection_mark, expected_selection_mark in zip( page.selection_marks or [], expected_page.selection_marks or []): self.assertDocumentSelectionMarkTransformCorrect( selection_mark, expected_selection_mark) for span, expected_span in zip(page.spans or [], expected_page.spans or []): self.assertSpanTransformCorrect(span, expected_span)
def assertFormPagesTransformCorrect(self, form_pages, read_result, page_result=None, **kwargs): for page, expected_page in zip(form_pages, read_result): if hasattr(page, "pages"): # this is necessary for how unlabeled forms are structured page = page.pages[0] self.assertEqual(page.page_number, expected_page.page) self.assertEqual(page.text_angle, adjust_text_angle(expected_page.angle)) self.assertEqual(page.width, expected_page.width) self.assertEqual(page.height, expected_page.height) self.assertEqual(page.unit, expected_page.unit) for line, expected_line in zip(page.lines or [], expected_page.lines or []): self.assertFormLineTransformCorrect(line, expected_line) for selection_mark, expected_selection_mark in zip(page.selection_marks or [], expected_page.selection_marks or []): self.assertFormSelectionMarkTransformCorrect(selection_mark, expected_selection_mark) if page_result: for page, expected_page in zip(form_pages, page_result): if hasattr(page, "pages"): # this is necessary for how unlabeled forms are structured page = page.pages[0] if expected_page.tables: self.assertTablesTransformCorrect(page.tables, expected_page.tables, read_result, **kwargs)