def get_frequent_splits(): forest = RandomForest(num_trees=100, max_depth=2) forest.train(training_data, training_labels) lst = forest.most_frequent_first_splits() for item in lst: word = ' < ' split, frequency = item feature, value = split name = feature_names[feature] print(name + word + str(value) + ' (' + str(frequency) + ' trees)')
def get_frequent_splits(): forest = RandomForest(num_trees = 100, max_depth = 2, categorical_vars = cat_set) forest.train(training_data, training_labels) lst = forest.most_frequent_first_splits() for item in lst: word = ' < ' split, frequency = item feature, value = split if feature in cat_set: value = inverse_list[feature - CONTINUOUS_FEATURES][value] word = ' is ' name = feature_names[feature] print(name + word + str(value) + ' (' + str(frequency) + ' trees)')