def main(): """ Main function of the script. """ feature_data, classification_data = wdbc.load_data_set() plot_classification_frequency(classification_data) plot_feature_correlation(feature_data) plot_feature_distribution(feature_data, classification_data)
def main(): """ Main function of the script. """ feature_data, classification_data = wdbc.load_data_set() # scikit-learn functions require classification in terms of numerical # values (i.e. 0, 1, 2) instead of strings (e.g. 'benign', 'malignant') label_encoder = preprocessing.LabelEncoder() label_encoder.fit(classification_data) classification_data_numerical = label_encoder.transform(classification_data) test_naive_bayes(feature_data, classification_data_numerical)
def main(): """ Main function of the script. """ feature_data, classification_data = wdbc.load_data_set() # scikit-learn functions require classification in terms of numerical # values (i.e. 0, 1, 2) instead of strings (e.g. 'benign', 'malignant') label_encoder = preprocessing.LabelEncoder() label_encoder.fit(classification_data) classification_data_numerical = label_encoder.transform( classification_data) test_naive_bayes(feature_data, classification_data_numerical)
def main(): """ Main function of the script. """ feature_data, classification_data = wdbc.load_data_set() # scikit-learn functions require classification in terms of numerical # values (i.e. 0, 1, 2) instead of strings (e.g. 'benign', 'malignant') label_encoder = preprocessing.LabelEncoder() label_encoder.fit(classification_data) classification_data_numerical = label_encoder.transform(classification_data) plot_accuracy_vs_folds(feature_data, classification_data_numerical) optimise_knn_parameters(feature_data, classification_data_numerical)
def main(): """ Main function of the script. """ feature_data, classification_data = wdbc.load_data_set() # scikit-learn functions require classification in terms of numerical # values (i.e. 0, 1, 2) instead of strings (e.g. 'benign', 'malignant') label_encoder = preprocessing.LabelEncoder() label_encoder.fit(classification_data) classification_data_numerical = label_encoder.transform( classification_data) plot_accuracy_vs_folds(feature_data, classification_data_numerical) optimise_knn_parameters(feature_data, classification_data_numerical)
def main(): """ Main function of the script. """ feature_data, classification_data = wdbc.load_data_set() # scikit-learn functions require classification in terms of numerical # values (i.e. 0, 1, 2) instead of strings (e.g. 'benign', 'malignant') label_encoder = preprocessing.LabelEncoder() label_encoder.fit(classification_data) classification_data_numerical = label_encoder.transform(classification_data) test_nearest_neighbors(feature_data, classification_data_numerical) optimise_nearest_neighbours(feature_data, classification_data_numerical) validation_metrics(feature_data, classification_data_numerical) plot_accuracies(feature_data, classification_data_numerical) plot_decision_boundaries(feature_data, classification_data_numerical)
def main(): """ Main function of the script. """ feature_data, classification_data = wdbc.load_data_set() # scikit-learn functions require classification in terms of numerical # values (i.e. 0, 1, 2) instead of strings (e.g. 'benign', 'malignant') label_encoder = preprocessing.LabelEncoder() label_encoder.fit(classification_data) classification_data_numerical = label_encoder.transform( classification_data) test_nearest_neighbors(feature_data, classification_data_numerical) optimise_nearest_neighbours(feature_data, classification_data_numerical) validation_metrics(feature_data, classification_data_numerical) plot_accuracies(feature_data, classification_data_numerical) plot_decision_boundaries(feature_data, classification_data_numerical)