def make_single_file_featureset_data():
    """
    Generate the on-disk fixtures used by tests that verify that
    specifying ``train_file`` and ``test_file`` actually works.

    Three ``.jsonlines`` files are written underneath ``_my_dir``:

    * ``train/train_single_file.jsonlines`` -- the training feature set
    * ``test/test_single_file.jsonlines`` -- the test feature set
    * ``test/test_single_file_subset.jsonlines`` -- the test feature set
      after it has been filtered to the features ``f01`` and ``f02``
    """
    training_set, testing_set = make_classification_data(num_examples=600,
                                                         train_test_ratio=0.8,
                                                         num_labels=2,
                                                         num_features=3,
                                                         non_negative=False)

    # Serialize the training feature set.
    NDJWriter(join(_my_dir, 'train', 'train_single_file.jsonlines'),
              training_set).write()

    # Serialize the test feature set as generated.
    NDJWriter(join(_my_dir, 'test', 'test_single_file.jsonlines'),
              testing_set).write()

    # Finally, produce a test file with fewer features than the training
    # set. The return value of filter() is ignored and the same object is
    # written afterwards, so this relies on filter() modifying the test
    # set in place; that is also why it must come after the write above.
    testing_set.filter(features=['f01', 'f02'])
    NDJWriter(join(_my_dir, 'test', 'test_single_file_subset.jsonlines'),
              testing_set).write()
# NOTE(review): a definition with this same name (one that additionally
# writes 'test_single_file_subset.jsonlines') is visible right before this
# one. If both really live in the same module, this later definition
# shadows it -- confirm which variant is intended.
def make_single_file_featureset_data():
    """
    Generate the on-disk fixtures used by tests that verify that
    specifying ``train_file`` and ``test_file`` actually works.

    Two ``.jsonlines`` files are written underneath ``_my_dir``:
    ``train/train_single_file.jsonlines`` with the training feature set
    and ``test/test_single_file.jsonlines`` with the test feature set.
    """
    training_set, testing_set = make_classification_data(num_examples=600,
                                                         train_test_ratio=0.8,
                                                         num_labels=2,
                                                         num_features=3,
                                                         non_negative=False)

    # (sub-directory, file name, feature set) for each file to produce;
    # the training file is written first, then the test file.
    outputs = (
        ('train', 'train_single_file.jsonlines', training_set),
        ('test', 'test_single_file.jsonlines', testing_set),
    )
    for subdir, filename, feature_set in outputs:
        NDJWriter(join(_my_dir, subdir, filename), feature_set).write()