def parse_xml(directory):
    """Yield one ``ParsedOutput`` for every entry listed in *directory*.

    Each entry is read in full, handed to ``parse_parser_xml_results``
    together with the entry name (minus a trailing ``.xml`` suffix) and
    ``raw_output=False``, and the result is wrapped in ``ParsedOutput``.
    The stripped name is printed before the entry is opened.

    Every entry returned by ``os.listdir`` is processed, whatever its
    extension.

    :param directory: path of the directory whose entries are parsed.
    :returns: a generator of ``ParsedOutput`` objects, one per entry.
    """
    for xmlfile in os.listdir(directory):
        # The dot is escaped so that only a literal ".xml" suffix is removed;
        # the unescaped pattern also ate names such as "fooxml" -> "fo".
        # os.listdir yields bare entry names, so no basename() call is needed.
        file_name = re.sub(r'\.xml$', '', xmlfile)
        # Parenthesised single-argument form prints the same text under the
        # print statement and the print function.
        print(file_name)
        # Read inside a context manager so the handle is closed before the
        # generator suspends at the yield below.
        with open(os.path.join(directory, xmlfile), 'r') as f_in:
            xml_text = f_in.read()
        yield ParsedOutput(
            parse_parser_xml_results(xml_text, file_name, raw_output=False))
def dcoref_opener(file_path, fname):
    """Load the coreference chains stored in ``<fname>.raw.xml``.

    The file is read from *file_path* and passed to
    ``parse_parser_xml_results``; the ``"coref"`` entry of the result is
    then flattened so that each group becomes one set of 4-tuples built
    from fields 0, 1, 3 and 4 of every item in every pair.
    NOTE(review): the fields are presumably mention text, sentence index,
    start and end offsets -- confirm against the parser's output format.

    :param file_path: directory containing the XML file.
    :param fname: file name without the ``.raw.xml`` suffix.
    :returns: a list of sets of tuples, one set per coreference group.
    """
    xml_path = os.path.join(file_path, fname + ".raw.xml")
    with open(xml_path, "r") as f_in:
        nlp = parse_parser_xml_results(f_in.read())

    # One set per group; duplicates across pairs collapse automatically.
    return [
        {
            (mention[0], mention[1], mention[3], mention[4])
            for pair in group
            for mention in pair
        }
        for group in nlp["coref"]
    ]
def dcoref_opener(file_path, fname):
    """Return the coreference groups found in ``<fname>.raw.xml``.

    Reads the file located under *file_path*, parses it with
    ``parse_parser_xml_results`` and walks the ``"coref"`` entry of the
    parsed result. Every group is reduced to a set of
    ``(item[0], item[1], item[3], item[4])`` tuples collected from all
    items of all pairs in that group.

    :param file_path: directory that holds the XML file.
    :param fname: base name of the file; ``.raw.xml`` is appended.
    :returns: a list with one set of 4-tuples per group.
    """
    source = os.path.join(file_path, fname + ".raw.xml")
    with open(source, "r") as handle:
        parsed = parse_parser_xml_results(handle.read())

    groups = []
    for group in parsed["coref"]:
        members = set()
        for pair in group:
            # Index 2 of each item is deliberately skipped, as in the
            # tuple layout (0, 1, 3, 4).
            members.update(
                (item[0], item[1], item[3], item[4]) for item in pair)
        groups.append(members)
    return groups
def open_and_parse_xml_file(self, file_name):
    """Read *file_name* and return its parsed contents.

    The whole file is read as text and passed to
    ``parse_parser_xml_results``; whatever that call returns is returned
    unchanged. ``self`` is not used.

    :param file_name: path of the XML file to read.
    :returns: the result of ``parse_parser_xml_results`` for the file text.
    """
    with open(file_name, "r") as xml_file:
        xml_text = xml_file.read()
    return parse_parser_xml_results(xml_text)
def stanford_general_opener(file_path, f_name):
    """Parse the ``<f_name>.head.coref.raw.xml`` file under *file_path*.

    The file is read in full and its text is handed to
    ``parse_parser_xml_results``; the parser's return value is passed
    straight back to the caller.

    :param file_path: directory containing the XML file.
    :param f_name: file name without the ``.head.coref.raw.xml`` suffix.
    :returns: the result of ``parse_parser_xml_results``.
    """
    xml_path = os.path.join(file_path, f_name + ".head.coref.raw.xml")
    with open(xml_path, "r") as f_in:
        xml_text = f_in.read()
    return parse_parser_xml_results(xml_text)
def stanford_general_opener(file_path, f_name):
    """Open a ``.head.coref.raw.xml`` file and return its parsed form.

    The path is built by joining *file_path* with *f_name* plus the
    ``.head.coref.raw.xml`` suffix. The file contents are read as text
    and given to ``parse_parser_xml_results``.

    :param file_path: directory in which the file lives.
    :param f_name: base name of the file, suffix excluded.
    :returns: whatever ``parse_parser_xml_results`` returns for the text.
    """
    target_name = f_name + ".head.coref.raw.xml"
    with open(os.path.join(file_path, target_name), "r") as source:
        contents = source.read()
    parsed = parse_parser_xml_results(contents)
    return parsed