def munge_page(fn, regex, out_fn=None, tag='build'):
    """Run ``munge_content`` over every line of ``fn`` and write the result.

    :param fn: Path of the file whose lines are read via
        ``decode_lines_from_file``.
    :param regex: Passed through unchanged as the second argument of
        ``munge_content`` for each line.
    :param out_fn: Path to write to; when ``None`` the input file ``fn`` is
        overwritten.
    :param tag: Prefix used in the log messages.

    Nothing is written (and a warning is logged instead) when no lines were
    produced.
    """
    target = fn if out_fn is None else out_fn

    # Entries that come back as None from the reader are skipped, not munged.
    rewritten = []
    for raw in decode_lines_from_file(fn):
        if raw is None:
            continue
        rewritten.append(munge_content(raw, regex))

    if not rewritten:
        logger.warning('{0}: did not write {1}'.format(tag, target))
        return

    encode_lines_to_file(target, rewritten)
    logger.info('{0}: processed {1}'.format(tag, fn))
def manual_single_html(input_file, output_file):
    """Rewrite links and the robots meta tag of a single-page HTML file.

    Reads the lines of ``input_file``, applies three literal substitutions to
    every line, and writes the result to ``output_file``:

    * ``href="contents.html`` -> ``href="index.html``
    * ``name="robots" content="index"`` -> ``name="robots" content="noindex"``
    * ``href="genindex.html`` -> ``href="../genindex/``

    :param input_file: Path of the HTML file to read.
    :param output_file: Path the rewritten lines are written to.
    :returns: ``False`` when ``check_dependency(output_file, input_file)`` is
        ``False`` and the file is left untouched; otherwise ``None`` after
        the output has been written.
    """
    # NOTE(review): a second definition of this function appears later in
    # this file and is the one that takes effect at import time.

    # Don't rebuild the output if it's not needed.
    if check_dependency(output_file, input_file) is False:
        logger.info('singlehtml not changed, not reprocessing.')
        return False

    # These are plain-text substitutions. Literal str.replace is used instead
    # of regular expressions so that the "." in the file names cannot match
    # an arbitrary character.
    substitutions = (
        ('href="contents.html', 'href="index.html'),
        ('name="robots" content="index"', 'name="robots" content="noindex"'),
        ('href="genindex.html', 'href="../genindex/'),
    )

    text_lines = decode_lines_from_file(input_file)
    for old, new in substitutions:
        text_lines = [text.replace(old, new) for text in text_lines]

    encode_lines_to_file(output_file, text_lines)
    logger.info('processed singlehtml file.')
def manual_single_html(input_file, output_file):
    """Rewrite links and the robots meta tag of a single-page HTML file.

    Reads the lines of ``input_file``, applies three literal substitutions to
    every line, and writes the result to ``output_file``:

    * ``href="contents.html`` -> ``href="index.html``
    * ``name="robots" content="index"`` -> ``name="robots" content="noindex"``
    * ``href="genindex.html`` -> ``href="../genindex/``

    :param input_file: Path of the HTML file to read.
    :param output_file: Path the rewritten lines are written to.
    :returns: ``False`` when ``check_dependency(output_file, input_file)`` is
        ``False`` and the file is left untouched; otherwise ``None`` after
        the output has been written.
    """
    # NOTE(review): an earlier definition of this function exists in this
    # file; this later one replaces it at import time.

    # Don't rebuild the output if it's not needed.
    if check_dependency(output_file, input_file) is False:
        logger.info('singlehtml not changed, not reprocessing.')
        return False

    # These are plain-text substitutions. Literal str.replace is used instead
    # of regular expressions so that the "." in the file names cannot match
    # an arbitrary character.
    substitutions = (
        ('href="contents.html', 'href="index.html'),
        ('name="robots" content="index"', 'name="robots" content="noindex"'),
        ('href="genindex.html', 'href="../genindex/'),
    )

    text_lines = decode_lines_from_file(input_file)
    for old, new in substitutions:
        text_lines = [text.replace(old, new) for text in text_lines]

    encode_lines_to_file(output_file, text_lines)
    logger.info('processed singlehtml file.')