def modifyShakespeare(file_in, file_out): builder = FileBuilder(file_in, file_out) builder.remove_lines(line_last, len(builder)) builder.remove_lines(0, line_first) builder.remove_repeated_empty_lines() builder.remove_lines_within("<<", ">>") builder.remove_number_lines(6) builder.sub('[<}`\r]', '') builder.sub('[|_]', ' ') char_words = [ '!', '"', '&', '(', ')', ',', '-', '.', ':', ';', '?', '[', ']', '\n' ] builder.to_words(char_words) builder.to_words_apostrophes() builder.to_lowercase() builder.strip_lines()
def test_strip(): builder = FileBuilder("../test_text/strip.txt", outfile) builder.strip_lines() assert builder[0] == "hello\n" assert builder[1] == "world\n" assert builder[2] == "ok\n"