def test_getting_tables_from_pptx(self):
    """getTableDocumentList on the two-table PPTX fixture returns two
    documents, the first of which holds exactly one ``w:tbl`` element."""
    granulator = GranulateOpenXML(
        File(data=TWO_TABLES_PPTX_DATA, filename='two_tables.pptx'))
    files_with_single_tables = granulator.getTableDocumentList()
    # Check the count before indexing so that an empty result is reported
    # as an assertion failure rather than an IndexError.
    self.assertEqual(len(files_with_single_tables), 2)
    first_file = files_with_single_tables[0]
    # NOTE(review): the part read here is 'word/document.xml' although the
    # input fixture is a PPTX -- presumably the granulator emits each table
    # as a word-processing package; confirm against GranulateOpenXML.
    document_xml = first_file.read('word/document.xml')
    xml_root = etree.fromstring(document_xml)
    tbl_tags = xml_root.xpath('//w:tbl', namespaces=xml_root.nsmap)
    self.assertEqual(len(tbl_tags), 1)
def test_get_thumbnails_from_pptx(self):
    """getThumbnailsDocument on the two-table PPTX fixture yields an object
    whose ``getvalue()`` equals THUMBNAILS_PPTX_DATA."""
    granulator = GranulateOpenXML(
        File(data=TWO_TABLES_PPTX_DATA, filename='two_tables.pptx'))
    thumbnails_pptx = granulator.getThumbnailsDocument()
    # assertEqual replaces the deprecated assertEquals alias.
    self.assertEqual(thumbnails_pptx.getvalue(), THUMBNAILS_PPTX_DATA)
def test_get_thumbnails_from_docx(self):
    """getThumbnailsDocument on the three-table DOCX fixture yields an object
    whose ``getvalue()`` equals THUMBNAILS_DOCX_DATA."""
    granulator = GranulateOpenXML(
        File(data=THREE_TABLES_DOCX_DATA, filename='three_tables.docx'))
    thumbnails_docx = granulator.getThumbnailsDocument()
    # assertEqual replaces the deprecated assertEquals alias.
    self.assertEqual(thumbnails_docx.getvalue(), THUMBNAILS_DOCX_DATA)
def test_getting_images_from_pptx(self):
    """getImageDocumentList on the one-image PPTX fixture returns a single
    entry whose ``getvalue()`` equals FIRST_PPTX_IMAGE."""
    granulator = GranulateOpenXML(
        File(data=PPTX_DATA, filename='test_1image.pptx'))
    images = granulator.getImageDocumentList()
    # assertEqual replaces the deprecated assertEquals alias.
    self.assertEqual(len(images), 1)
    self.assertEqual(FIRST_PPTX_IMAGE, images[0].getvalue())
def test_getting_images_from_docx(self):
    """getImageDocumentList on the 27-image DOCX fixture returns 27 entries,
    the first of which has ``getvalue()`` equal to FIRST_DOCX_IMAGE."""
    granulator = GranulateOpenXML(
        File(data=DOCX_DATA, filename='test_27images.docx'))
    images = granulator.getImageDocumentList()
    # assertEqual replaces the deprecated assertEquals alias.
    self.assertEqual(len(images), 27)
    self.assertEqual(FIRST_DOCX_IMAGE, images[0].getvalue())