示例#1
0
    def get_summarised_data(self):
        """Run the six-stage analysis pipeline and return its final result.

        Stages, in order:
          1. ``Miner.get_page_objids`` is queried for ``self.filename``.
          2. ``self.get_toc`` supplies the table of contents.
          3. ``self.get_level`` is applied to it with ``level=1``.
          4. ``self.pagify`` combines that result with the stage-1 pages.
          5. ``self.add_range`` processes the pagified entries.
          6. ``self.add_content`` produces the value that is returned.

        A progress marker is printed to stdout after each stage.

        Returns:
            The value produced by ``self.add_content``.
        """
        print('Analysing data...')

        page_ids = Miner.get_page_objids(pdf_path=self.filename)
        print('[1/6]')

        # get_toc() returns a pair; only its first element is used here.
        outline, _ = self.get_toc()
        print('[2/6]')

        top_level = self.get_level(toc=outline, level=1)
        print('[3/6]')

        with_pages = self.pagify(top_level, page_ids)
        print('[4/6]')

        with_ranges = self.add_range(with_pages)
        print('[5/6]')

        summarised = self.add_content(with_ranges)
        print('[6/6]')

        return summarised