def test_shuffle_with_seed(tmpdir):
    """Check that ``shuffle`` is reproducible for a given seed.

    A ``DocumentArrayMemmap`` created from ``tmpdir`` is filled with the
    output of ``random_docs(100)``. It is then shuffled twice with seed 1
    and once with seed 2. The test asserts that every result has the same
    length as the source, that the two seed-1 results compare equal, and
    that the seed-1 and seed-2 results compare unequal.
    """
    memmap = DocumentArrayMemmap(tmpdir)
    memmap.extend(list(random_docs(100)))

    same_seed_a = memmap.shuffle(seed=1)
    same_seed_b = memmap.shuffle(seed=1)
    other_seed = memmap.shuffle(seed=2)

    # Every shuffled result must be as long as the array it came from.
    expected_size = len(memmap)
    for result in (same_seed_a, same_seed_b, other_seed):
        assert len(result) == expected_size

    # Same seed -> equal results; different seed -> unequal results.
    assert same_seed_a == same_seed_b
    assert same_seed_a != other_seed
def test_shuffle(tmpdir):
    """Check that an unseeded ``shuffle`` reorders without losing documents.

    A ``DocumentArrayMemmap`` created from ``tmpdir`` is filled with the
    output of ``random_docs(100)`` and shuffled with no arguments. The
    test asserts that the result has the same length as the source, is a
    ``DocumentArray`` instance, lists its ids in a different order than
    the source, and contains exactly the same ids once both are sorted.
    """

    def collect_ids(documents):
        # Ids in iteration order.
        return [doc.id for doc in documents]

    memmap = DocumentArrayMemmap(tmpdir)
    memmap.extend(list(random_docs(100)))

    result = memmap.shuffle()

    assert len(result) == len(memmap)
    assert isinstance(result, DocumentArray)

    original_order = collect_ids(memmap)
    shuffled_order = collect_ids(result)

    # The order must differ ...
    assert original_order != shuffled_order

    # ... while the ids themselves stay the same (compare sorted copies).
    original_sorted = list(original_order)
    original_sorted.sort()
    shuffled_sorted = list(shuffled_order)
    shuffled_sorted.sort()
    assert original_sorted == shuffled_sorted