def test_excel():
    """Run the full pipeline against ``test/excel_demo.yaml``.

    Builds an ``OCRFlow`` from the config file, then calls
    ``download_from_excel``, ``transform_documents`` and ``extract_fields``
    in that order.

    Returns:
        The ``OCRFlow`` instance after all three stages have been called.
    """
    pipeline = OCRFlow("test/excel_demo.yaml")
    pipeline.download_from_excel()
    pipeline.transform_documents()
    pipeline.extract_fields()
    return pipeline
def test_advanced():
    """Run the full pipeline against ``test/advanced.yaml``.

    Builds an ``OCRFlow`` from the config file, then calls
    ``download_from_excel``, ``transform_documents`` and ``extract_fields``
    in that order.

    Returns:
        The ``OCRFlow`` instance after all three stages have been called.
    """
    pipeline = OCRFlow("test/advanced.yaml")
    pipeline.download_from_excel()
    pipeline.transform_documents()
    pipeline.extract_fields()
    return pipeline
def test_pdftext():
    """Download and transform documents using ``test/edcon.yaml``.

    Unlike the sibling test helpers, this one stops after
    ``transform_documents`` and never calls ``extract_fields``.

    Returns:
        The ``OCRFlow`` instance after the download and transform stages.
    """
    # NOTE(review): despite the function name, the active config is
    # test/edcon.yaml; a commented-out earlier variant used
    # test/pdftext.yaml. Confirm which one is intended.
    pipeline = OCRFlow("test/edcon.yaml")
    pipeline.download_from_excel()
    pipeline.transform_documents()
    return pipeline
def test_multipage():
    """Run the full pipeline against ``test/multipage.yaml``.

    Builds an ``OCRFlow`` from the config file, then calls
    ``download_from_excel``, ``transform_documents`` and ``extract_fields``
    in that order.

    Returns:
        The ``OCRFlow`` instance after all three stages have been called.
    """
    pipeline = OCRFlow("test/multipage.yaml")
    pipeline.download_from_excel()
    pipeline.transform_documents()
    pipeline.extract_fields()
    return pipeline
def serve_flask():
    """Start ``flaskapp`` through its ``run`` method on 0.0.0.0, port 5000."""
    # 0.0.0.0 listens on every network interface, not only loopback.
    flaskapp.run(host="0.0.0.0", port=5000)


if __name__ == "__main__":
    # The first command-line argument selects the flow configuration; when it
    # is absent, fall back to the Excel demo config. Only IndexError is
    # caught so that unrelated failures (and Ctrl-C) are not swallowed.
    try:
        config_filename = sys.argv[1]
    except IndexError:
        config_filename = "test/excel_demo.yaml"

    # Configure logging from logging.yaml in the current working directory.
    # safe_load is used because calling yaml.load without an explicit Loader
    # is deprecated in PyYAML 5.1+ and rejected by PyYAML 6, and a logging
    # config only needs plain YAML types.
    with open("logging.yaml") as fh:
        log_settings = yaml.safe_load(fh)
    logging.config.dictConfig(log_settings)
    LOGGER = logging.getLogger(__name__)
    LOGGER.info("Logging enabled")

    # NOTE(review): hard-coded secret key; anything signed with it can be
    # forged by whoever reads this file. Load it from the environment or a
    # secrets store before deploying.
    flaskapp.secret_key = 'super secret key'

    flow = OCRFlow(config_filename)
    # Pull documents from whichever sources the configuration declares.
    if "excel_file" in flow.settings:
        flow.download_from_excel()
    if "cmis_url" in flow.settings:
        flow.download_from_cmis()
    flow.transform_documents()
    flow.extract_fields()

    # NOTE(review): serve_gevent is not defined in this section of the file;
    # presumably it is defined or imported elsewhere. If it blocks until the
    # server stops, the log line below is only emitted at shutdown - confirm.
    serve_gevent()
    LOGGER.info("Web server started")