def run(filepaths, out_file, s_parsed):
    """Read XML input, code it, and write the events to ``'evts.' + out_file``.

    This is the routine called from main().

    Args:
        filepaths: Input location(s) forwarded to ``PETRreader.read_xml_input``.
        out_file: Name forwarded to ``do_coding`` and, prefixed with
            ``'evts.'``, to ``PETRwriter.write_events``.
        s_parsed: Forwarded to the reader only; this variant never runs the
            Stanford parser itself.
    """
    stories = PETRreader.read_xml_input(filepaths, s_parsed)
    coded_stories = do_coding(stories, out_file)
    PETRwriter.write_events(coded_stories, 'evts.' + out_file)
def run_pipeline(data, out_file=None, config=None, write_output=True,
                 parsed=False):
    """Code a batch of pipeline input and either return or write the events.

    Args:
        data: Input handed unchanged to ``PETRreader.read_pipeline_input``.
        out_file: Destination passed to ``PETRwriter.write_events``; required
            when ``write_output`` is true.
        config: Optional config path for ``PETRreader.parse_Config``. When
            falsy, the file located by
            ``utilities._get_data('data/config/', 'PETR_config.ini')`` is used.
        write_output: When false, the coded events are converted with
            ``PETRwriter.pipe_output`` and returned instead of written.
        parsed: When false, the events are run through
            ``utilities.stanford_parse`` before coding.

    Returns:
        The value of ``PETRwriter.pipe_output`` when ``write_output`` is
        false; otherwise ``None``.

    Raises:
        SystemExit: If ``write_output`` is true but ``out_file`` is falsy.
    """
    utilities.init_logger('PETRARCH.log')
    logger = logging.getLogger('petr_log')

    if config:
        message = 'Using user-specified config: {}'.format(config)
        print(message)
        logger.info(message)
        PETRreader.parse_Config(config)
    else:
        logger.info('Using default config file.')
        # Resolve the default path once and reuse it for logging and parsing.
        default_config = utilities._get_data('data/config/', 'PETR_config.ini')
        logger.info('Config path: {}'.format(default_config))
        PETRreader.parse_Config(default_config)

    read_dictionaries()

    logger.info('Hitting read events...')
    events = PETRreader.read_pipeline_input(data)
    if parsed:
        logger.info('Hitting do_coding')
    else:
        events = utilities.stanford_parse(events)
    updated_events = do_coding(events, None)

    if not write_output:
        return PETRwriter.pipe_output(updated_events)

    if not out_file:
        print('Please specify an output file...')
        # Raw string: a bare "\_" is an invalid escape sequence and triggers
        # a warning on modern Python. The logged text is unchanged.
        logger.warning(r'Need an output file. ¯\_(ツ)_/¯')
        # NOTE(review): exits with status 0, kept for backward compatibility.
        sys.exit()

    PETRwriter.write_events(updated_events, out_file)
def run_pipeline(data, out_file=None, config=None, write_output=True,
                 parsed=False):
    """Code pre-parsed pipeline input and either return or write the events.

    This is called externally.

    Args:
        data: Input handed unchanged to ``PETRreader.read_pipeline_input``.
        out_file: Destination passed to ``PETRwriter.write_events``; required
            when ``write_output`` is true.
        config: Optional config path for ``PETRreader.parse_Config``. When
            falsy, the file located by
            ``utilities._get_data('data/config/', 'PETR_config.ini')`` is used.
        write_output: When false, the coded events are converted with
            ``PETRwriter.pipe_output`` and returned instead of written.
        parsed: Must be true. The Stanford-parse fallback is disabled in this
            version, so unparsed input cannot be coded.

    Returns:
        The value of ``PETRwriter.pipe_output`` when ``write_output`` is
        false; otherwise ``None``.

    Raises:
        ValueError: If ``parsed`` is false.
        SystemExit: If ``write_output`` is true but ``out_file`` is falsy.
    """
    utilities.init_logger('PETRARCH.log')
    logger = logging.getLogger('petr_log')

    if config:
        message = 'Using user-specified config: {}'.format(config)
        print(message)
        logger.info(message)
        PETRreader.parse_Config(config)
    else:
        logger.info('Using default config file.')
        # Resolve the default path once and reuse it for logging and parsing.
        default_config = utilities._get_data('data/config/', 'PETR_config.ini')
        logger.info('Config path: {}'.format(default_config))
        PETRreader.parse_Config(default_config)

    read_dictionaries()

    logger.info('Hitting read events...')
    events = PETRreader.read_pipeline_input(data)

    if not parsed:
        # Previously this path fell through with `updated_events` unassigned
        # and crashed later with UnboundLocalError. Fail with a clear reason.
        reason = ('run_pipeline() requires pre-parsed input (parsed=True); '
                  'the Stanford-parse fallback is disabled.')
        logger.error(reason)
        raise ValueError(reason)

    logger.info('Hitting do_coding')
    updated_events = do_coding(events, None)

    if not write_output:
        return PETRwriter.pipe_output(updated_events)

    if not out_file:
        print('Please specify an output file...')
        # Raw string: a bare "\_" is an invalid escape sequence and triggers
        # a warning on modern Python. The logged text is unchanged.
        logger.warning(r'Need an output file. ¯\_(ツ)_/¯')
        # NOTE(review): exits with status 0, kept for backward compatibility.
        sys.exit()

    PETRwriter.write_events(updated_events, out_file)
def run(filepaths, out_file, s_parsed):
    """Read XML input, code it, and write the events to ``'evts.' + out_file``.

    This is the routine called from main().

    Args:
        filepaths: Input location(s) forwarded to ``PETRreader.read_xml_input``.
        out_file: Output name; ``'evts.'`` is prepended before it is passed
            to ``PETRwriter.write_events``.
        s_parsed: Forwarded to the reader only; this variant never runs the
            Stanford parser itself.
    """
    logger = logging.getLogger('petr_log')

    events = PETRreader.read_xml_input(filepaths, s_parsed)
    # The message needs a %s placeholder: passing `events` as a logging
    # argument without one makes the handler report a formatting error
    # whenever DEBUG output is enabled.
    logger.debug("Incoming data from XML: %s", events)

    updated_events = do_coding(events)
    PETRwriter.write_events(updated_events, 'evts.' + out_file)
def run(filepaths, out_file, s_parsed):
    """Read XML input, code it, and write one output file.

    This is the routine called from main().

    The writer and file-name prefix are chosen from ``PETRglobals``:
    ``NullVerbs`` selects ``write_nullverbs`` / ``'nullverbs.'``, otherwise
    ``NullActors`` selects ``write_nullactors`` / ``'nullactors.'``, otherwise
    ``write_events`` / ``'evts.'``.

    Args:
        filepaths: Input location(s) forwarded to ``PETRreader.read_xml_input``.
        out_file: Base output name; the selected prefix is prepended.
        s_parsed: When false, the events are run through
            ``utilities.stanford_parse`` before coding.
    """
    stories = PETRreader.read_xml_input(filepaths, s_parsed)
    if not s_parsed:
        stories = utilities.stanford_parse(stories)
    coded_stories = do_coding(stories)

    # Select the writer first, then make a single call.
    if PETRglobals.NullVerbs:
        writer, prefix = PETRwriter.write_nullverbs, 'nullverbs.'
    elif PETRglobals.NullActors:
        writer, prefix = PETRwriter.write_nullactors, 'nullactors.'
    else:
        writer, prefix = PETRwriter.write_events, 'evts.'
    writer(coded_stories, prefix + out_file)
def run(filepaths, out_file, s_parsed):
    """Read XML input, code it, and write one output file.

    This is the routine called from main().

    Args:
        filepaths: Input location(s) forwarded to ``PETRreader.read_xml_input``.
        out_file: Forwarded to ``do_coding`` and used, with a mode-specific
            prefix, as the output file name.
        s_parsed: When false, the events are run through
            ``utilities.stanford_parse`` before coding.
    """
    raw_events = PETRreader.read_xml_input(filepaths, s_parsed)
    to_code = raw_events if s_parsed else utilities.stanford_parse(raw_events)
    coded = do_coding(to_code, out_file)

    # Null-verb mode takes precedence over null-actor mode.
    if PETRglobals.NullVerbs:
        PETRwriter.write_nullverbs(coded, 'nullverbs.' + out_file)
        return
    if PETRglobals.NullActors:
        PETRwriter.write_nullactors(coded, 'nullactors.' + out_file)
        return
    PETRwriter.write_events(coded, 'evts.' + out_file)
def run(filepaths, out_file, s_parsed):
    """Read XML input and either extract null actors or code and write events.

    This is the routine called from main().

    Args:
        filepaths: Input location(s); printed, then forwarded to
            ``PETRreader.read_xml_input``.
        out_file: Output name. Used with a ``'nullverbs.'`` prefix in
            null-verb mode and as-is for regular events; null-actor mode
            always writes to ``'nullactors.txt'``.
        s_parsed: When false, the events are run through
            ``utilities.stanford_parse`` first.

    Returns:
        ``None`` when the module-level ``gna`` switch is truthy (only
        ``get_nullactor`` runs); otherwise whatever the selected
        ``PETRwriter`` function returns.
    """
    print(filepaths)
    events = PETRreader.read_xml_input(filepaths, s_parsed)
    if not s_parsed:
        events = utilities.stanford_parse(events)

    # NOTE(review): `gna` is defined outside this block; presumably the
    # "get null actors" switch -- confirm against its definition.
    if gna:
        get_nullactor(events)
        # Return explicitly so this path can never reach the writers below,
        # which depend on `updated_events`.
        return None

    updated_events = do_coding(events)
    print("update_event:")

    if PETRglobals.NullVerbs:
        return PETRwriter.write_nullverbs(updated_events,
                                          'nullverbs.' + out_file)
    if PETRglobals.NullActors:
        return PETRwriter.write_nullactors(updated_events, 'nullactors.txt')
    return PETRwriter.write_events(updated_events, out_file)
def run(filepaths, out_file, s_parsed):
    """Read XML input, code it, and write the events to ``out_file``.

    Args:
        filepaths: Input location(s) forwarded to ``PETRreader.read_xml_input``.
        out_file: Forwarded to ``do_coding`` and used unchanged as the
            destination for ``PETRwriter.write_events``.
        s_parsed: When false, the events are run through
            ``utilities.stanford_parse`` before coding.
    """
    stories = PETRreader.read_xml_input(filepaths, s_parsed)
    needs_parse = not s_parsed
    if needs_parse:
        stories = utilities.stanford_parse(stories)
    coded_stories = do_coding(stories, out_file)
    PETRwriter.write_events(coded_stories, out_file)