def test_encode(filename, seq_length, text):
    """Check the shape of what ``Dataset.encode`` returns for ``text``.

    A ``Dataset`` is built from the single ``filename`` and ``seq_length``,
    then ``text`` is encoded. The result must hold one entry per element of
    ``text``; every entry must sum to 1 and have ``vocab_size`` components
    (consistent with a one-hot style encoding -- presumably what the
    encoder produces; confirm against ``Dataset``).
    """
    corpus = Dataset([filename], seq_length)
    vectors = corpus.encode(text)

    # One encoded entry per input element.
    assert len(vectors) == len(text)

    for vector in vectors:
        # Components of each entry add up to exactly one ...
        assert sum(vector) == 1
        # ... and each entry spans the dataset's whole vocabulary.
        assert len(vector) == corpus.vocab_size
def test_decode(filename, seq_length, text):
    """Check that decoding an encoded ``text`` gives back the original.

    A ``Dataset`` is built from the single ``filename`` and ``seq_length``;
    ``text`` is passed through ``encode`` and then ``decode`` and the result
    is compared with the input for equality.
    """
    corpus = Dataset([filename], seq_length)

    # Round trip: encode first, then feed the encoding straight to decode.
    encoded = corpus.encode(text)
    round_tripped = corpus.decode(encoded)

    assert round_tripped == text