def main(): # parse HTML infile = sys.argv[1] inf = file(infile) p = HTMLParser(entities) for n, line in enumerate(inf): try: p.feed(line) except HTMLParseError as err: sys.stderr.write("%s:%d:%d: Parse error: %s\n" % (infile, err.lineno, err.offset, err.msg)) sys.exit(1) except Exception as err: sys.stderr.write("%s:%d:0: Error (%s): %s\n" % (infile, n + 1, repr(err), line)) sys.exit(1) p.close() inf.close() # generate groff sf = StringIO() f = Formatter(infile, sf) f.pp(fix(p.data)) s = sf.getvalue() sf.close() # strip excess whitespace blank_re = re.compile("[ \t\n]*\n([ \t]*\n)*") s = blank_re.sub("\n", s) s = s.lstrip() # write groff outf = file(sys.argv[2], "w") outf.write(s) outf.close()
def main(): # parse HTML infile = sys.argv[1] inf = file(infile) p = HTMLParser(entities) for n, line in enumerate(inf): try: p.feed(line) except HTMLParseError as err: sys.stderr.write('%s:%d:%d: Parse error: %s\n' % (infile, err.lineno, err.offset, err.msg)) sys.exit(1) except Exception as err: sys.stderr.write('%s:%d:0: Error (%s): %s\n' % (infile, n + 1, repr(err), line)) sys.exit(1) p.close() inf.close() # generate groff sf = StringIO() f = Formatter(infile, sf) f.pp(fix(p.data)) s = sf.getvalue() sf.close() # strip excess whitespace blank_re = re.compile("[ \t\n]*\n([ \t]*\n)*") s = blank_re.sub('\n', s) s = s.lstrip() # write groff outf = file(sys.argv[2], 'w') outf.write(s) outf.close()
p = HTMLParser(entities) for n, line in enumerate(inf): try: p.feed(line) except HTMLParseError, err: sys.stderr.write('%s:%d:%d: Parse error: %s\n' % (infile, err.lineno, err.offset, err.msg)) sys.exit(1) except Exception, err: sys.stderr.write('%s:%d:0: Error (%s): %s\n' % (infile, n + 1, repr(err), line)) sys.exit(1) p.close() inf.close() # generate groff sf = StringIO() f = Formatter(infile, sf) f.pp(p.data) s = sf.getvalue() sf.close() # strip excess whitespace blank_re = re.compile("[ \t\n]*\n([ \t]*\n)*") s = blank_re.sub('\n', s) s = s.lstrip() # write groff outf = file(sys.argv[2], 'w') outf.write(s) outf.close() if __name__ == "__main__":