def test_lazy_cuts_combine_split_issue():
    """Smoke test: combining lazy cuts and then splitting them must not raise.

    A dummy ``CutSet`` is written to a temporary ``.jsonl.gz`` manifest,
    re-opened lazily, combined with its ``perturb_speed(0.9)`` variant, and
    finally passed through ``split_lazy``. There are no assertions on the
    output; the test passes as long as no exception is raised.
    """
    eager_cuts = DummyManifest(CutSet, begin_id=0, end_id=1000)
    with TemporaryDirectory() as out_dir:
        with NamedTemporaryFile(suffix=".jsonl.gz") as manifest_file:
            manifest_path = manifest_file.name
            eager_cuts.to_file(manifest_path)
            manifest_file.flush()

            lazy_cuts = load_manifest_lazy(manifest_path)
            perturbed_cuts = lazy_cuts.perturb_speed(0.9)
            combined_cuts = combine(lazy_cuts, perturbed_cuts)
            # Return value is intentionally ignored: only the absence of an
            # exception is being checked.
            combined_cuts.split_lazy(out_dir, chunk_size=100)
def test_cut_set_subset_cut_ids_preserves_order_with_lazy_manifest():
    """Check that ``subset(cut_ids=...)`` keeps the requested ID order.

    The dummy cuts are written to a temporary ``.jsonl.gz`` manifest and
    re-opened through ``from_jsonl_lazy``. The requested IDs are deliberately
    not in ascending order, and the subset must yield exactly those three cuts
    in the order they were requested.
    """
    cut_ids = ["dummy-cut-0010", "dummy-cut-0171", "dummy-cut-0009"]
    eager_cuts = DummyManifest(CutSet, begin_id=0, end_id=1000)
    with NamedTemporaryFile(suffix=".jsonl.gz") as manifest_file:
        manifest_path = manifest_file.name
        eager_cuts.to_file(manifest_path)
        lazy_cuts = eager_cuts.from_jsonl_lazy(manifest_path)

        selected = lazy_cuts.subset(cut_ids=cut_ids)
        # Unpacking into exactly three names also fails the test if the
        # subset does not contain exactly three cuts.
        first, second, third = selected
        assert first.id == "dummy-cut-0010"
        assert second.id == "dummy-cut-0171"
        assert third.id == "dummy-cut-0009"