def test_basics():
    """Walk a LineFile through construction, copy, column edits and delete.

    The checks run in a fixed order because each step changes files on disk
    under ``tests/tmp``.
    """
    # NOTE(review): this file contains a second, later definition of
    # test_basics; Python keeps only the last binding, so this one is
    # shadowed at import time -- confirm whether one should be removed.
    source_path = "tests/smallcorpus.txt.bz2"
    work_path = "tests/tmp/testcorpus"
    # Kept as a string and split at every use so that each call site gets its
    # own list object, exactly as the inline ``.split()`` calls did.
    base_columns = "foo bar baz qux"

    corpus = LineFile(source_path, header=base_columns.split(), path=work_path)

    # Attributes recorded at construction time.
    assert_equal(corpus.header, base_columns.split())
    assert_equal(corpus.files, [source_path])
    assert_equal(corpus.path, work_path)
    assert_equal(corpus.tmppath, "tests/tmp/testcorpus.tmp")
    assert_equal(os.path.isfile(work_path), True)

    # A copy must live at a different path; mv_tmp() should leave "<path>.tmp".
    duplicate = corpus.copy()
    assert_not_equal(duplicate.path, corpus.path)
    duplicate.mv_tmp()
    assert_equal(os.path.isfile(duplicate.path + ".tmp"), True)
    # Cleanup check for the copy's temp file is currently disabled:
    #duplicate.delete_tmp()
    #assert_equal(os.path.isfile(duplicate.path + ".tmp"), False)

    # Add a constant-valued column and read it back from every line.
    corpus.make_column("quux", lambda x, y, z, w: "cat", base_columns.split())
    assert_equal(corpus.header, "foo bar baz qux quux".split())
    for row in corpus.lines(parts=False):
        assert_equal(corpus.extract_columns(row, "quux"), ["cat"])

    # Removing the column restores the original header.
    corpus.delete_columns("quux")
    assert_equal(corpus.header, base_columns.split())

    # Copy "qux" into a new "quux" column; both must agree on every line.
    corpus.copy_column("quux", "qux")
    assert_equal(corpus.header, "foo bar baz qux quux".split())
    for row in corpus.lines(parts=False):
        original_value = corpus.extract_columns(row, "qux")
        copied_value = corpus.extract_columns(row, "quux")
        assert_equal(original_value, copied_value)

    # delete() must remove the working file.
    corpus.delete()
    assert_equal(os.path.isfile(work_path), False)
def test_basics():
    """Walk a LineFile through construction, copy, column edits and delete.

    The checks run in a fixed order because each step changes files on disk
    under ``tests/tmp``.
    """
    # NOTE(review): an earlier definition of test_basics exists in this file;
    # this later binding is the one Python keeps -- confirm whether the
    # duplicate should be removed.
    source_path = "tests/smallcorpus.txt.bz2"
    work_path = "tests/tmp/testcorpus"
    # Kept as a string and split at every use so that each call site gets its
    # own list object, exactly as the inline ``.split()`` calls did.
    base_columns = "foo bar baz qux"

    corpus = LineFile(source_path, header=base_columns.split(), path=work_path)

    # Attributes recorded at construction time.
    assert_equal(corpus.header, base_columns.split())
    assert_equal(corpus.files, [source_path])
    assert_equal(corpus.path, work_path)
    assert_equal(corpus.tmppath, "tests/tmp/testcorpus.tmp")
    assert_equal(os.path.isfile(work_path), True)

    # A copy must live at a different path; mv_tmp() should leave "<path>.tmp".
    duplicate = corpus.copy()
    assert_not_equal(duplicate.path, corpus.path)
    duplicate.mv_tmp()
    assert_equal(os.path.isfile(duplicate.path + ".tmp"), True)
    # Cleanup check for the copy's temp file is currently disabled:
    #duplicate.delete_tmp()
    #assert_equal(os.path.isfile(duplicate.path + ".tmp"), False)

    # Add a constant-valued column and read it back from every line.
    corpus.make_column("quux", lambda x, y, z, w: "cat", base_columns.split())
    assert_equal(corpus.header, "foo bar baz qux quux".split())
    for row in corpus.lines(parts=False):
        assert_equal(corpus.extract_columns(row, "quux"), ["cat"])

    # Removing the column restores the original header.
    corpus.delete_columns("quux")
    assert_equal(corpus.header, base_columns.split())

    # Copy "qux" into a new "quux" column; both must agree on every line.
    corpus.copy_column("quux", "qux")
    assert_equal(corpus.header, "foo bar baz qux quux".split())
    for row in corpus.lines(parts=False):
        original_value = corpus.extract_columns(row, "qux")
        copied_value = corpus.extract_columns(row, "quux")
        assert_equal(original_value, copied_value)

    # delete() must remove the working file.
    corpus.delete()
    assert_equal(os.path.isfile(work_path), False)
def test_resum_equal_lazy():
    """Check lazy ``resum_equal`` for both ``keep_all`` settings.

    The sum of the "qux" column is taken once from a freshly loaded corpus.
    Then, for ``keep_all=False`` and ``keep_all=True`` in turn, the test calls
    ``resum_equal("foo", "qux", assert_sorted=True, lazy=True)`` and asserts
    that the "qux" value of every resulting line equals that sum.

    Each LineFile is deleted in a ``finally`` clause so that a failing
    assertion does not leave ``tests/tmp/testcorpus`` behind for later tests
    that reuse the same path.
    """
    # NOTE(review): this file contains a second, later definition of
    # test_resum_equal_lazy; Python keeps only the last binding, so this one
    # is shadowed at import time -- confirm whether one should be removed.

    def load_corpus():
        # Build a fresh LineFile (and a fresh header list) for each scenario.
        return LineFile("tests/smallcorpus.txt.bz2",
                        header="foo bar baz qux".split(),
                        path="tests/tmp/testcorpus")

    def resum_and_check(G, keep_all, expected):
        # Collapse "qux" over "foo" lazily, then verify every line's value.
        G.resum_equal("foo", "qux", assert_sorted=True, keep_all=keep_all, lazy=True)
        for line in G.lines():
            assert_equal(int(G.extract_columns(line, "qux")[0]), expected)

    G = load_corpus()
    try:
        # The length was never used by the original test; the call is kept so
        # that __len__ is still exercised before the column is summed.
        len(G)
        total = G.sum_column("qux")
        resum_and_check(G, False, total)
    finally:
        G.delete()

    # Second scenario reuses the total computed from the untouched corpus.
    G = load_corpus()
    try:
        resum_and_check(G, True, total)
    finally:
        G.delete()
def test_resum_equal_lazy():
    """Check lazy ``resum_equal`` for both ``keep_all`` settings.

    The sum of the "qux" column is taken once from a freshly loaded corpus.
    Then, for ``keep_all=False`` and ``keep_all=True`` in turn, the test calls
    ``resum_equal("foo", "qux", assert_sorted=True, lazy=True)`` and asserts
    that the "qux" value of every resulting line equals that sum.

    Each LineFile is deleted in a ``finally`` clause so that a failing
    assertion does not leave ``tests/tmp/testcorpus`` behind for later tests
    that reuse the same path.
    """
    # NOTE(review): an earlier definition of test_resum_equal_lazy exists in
    # this file; this later binding is the one Python keeps -- confirm whether
    # the duplicate should be removed.

    def load_corpus():
        # Build a fresh LineFile (and a fresh header list) for each scenario.
        return LineFile("tests/smallcorpus.txt.bz2",
                        header="foo bar baz qux".split(),
                        path="tests/tmp/testcorpus")

    def resum_and_check(G, keep_all, expected):
        # Collapse "qux" over "foo" lazily, then verify every line's value.
        G.resum_equal("foo", "qux", assert_sorted=True, keep_all=keep_all, lazy=True)
        for line in G.lines():
            assert_equal(int(G.extract_columns(line, "qux")[0]), expected)

    G = load_corpus()
    try:
        # The length was never used by the original test; the call is kept so
        # that __len__ is still exercised before the column is summed.
        len(G)
        total = G.sum_column("qux")
        resum_and_check(G, False, total)
    finally:
        G.delete()

    # Second scenario reuses the total computed from the untouched corpus.
    G = load_corpus()
    try:
        resum_and_check(G, True, total)
    finally:
        G.delete()