def generate_dataset(items, slots, voca: Vocabulary):
    """Convert raw (sentence, tag-sequence) pairs into a populated ``Dataset``.

    For every entry in ``items``:

    * ``item[0]`` is split on whitespace and each resulting word is passed
      through ``voca.get`` to build the ``vectors`` list.
    * ``item[1]`` is split on whitespace and each resulting tag is turned
      into a one-hot ``float32`` array of length ``len(slots)``, with the
      position ``slots.index(tag)`` set to 1.

    The original two strings plus both lists are then handed to
    ``Dataset.add``.

    Args:
        items: Iterable of indexable entries; index 0 is the sentence
            string and index 1 is the whitespace-separated tag string.
        slots: Sequence of known tags; must support ``len()`` and
            ``.index()``.
        voca: Vocabulary object used to look up each word via ``get``.

    Returns:
        The ``Dataset`` instance holding one record per entry of ``items``.

    Note:
        A tag that is not present in ``slots`` makes ``slots.index`` fail
        (``ValueError`` for a list/tuple -- presumably the type used by
        callers; confirm). No check is made that the number of words
        equals the number of tags.
    """

    def _one_hot(tag):
        # Allocate first, then look up the index, and size the array from
        # ``slots`` on every call so that ``slots`` is only touched when
        # there is actually a tag to encode.
        encoded = np.zeros([len(slots)], dtype=np.float32)
        encoded[slots.index(tag)] = 1
        return encoded

    result = Dataset()
    for entry in items:
        sentence = entry[0]
        word_vectors = [voca.get(token) for token in sentence.split()]

        tag_line = entry[1]
        tag_labels = [_one_hot(tag) for tag in tag_line.split()]

        result.add(sentence, tag_line, word_vectors, tag_labels)
    return result