def test_remove_empty_user_reviews(self):
    """
    Checks extractor.remove_empty_user_reviews against the module fixtures:
    the full fixture must reduce to reviews_matrix_non_emtpy, and the fixture
    sliced from index 4 onwards must reduce to an empty list.
    """
    # Full fixture: the result must equal the expected non-empty matrix.
    cleaned = extractor.remove_empty_user_reviews(reviews_matrix_emtpy)
    self.assertEqual(reviews_matrix_non_emtpy, cleaned)

    # Tail of the fixture (index 4 onwards): nothing is expected to remain.
    fixture_tail = reviews_matrix_emtpy[4:]
    cleaned_tail = extractor.remove_empty_user_reviews(fixture_tail)
    self.assertEqual([], cleaned_tail)
# NOTE(review): a definition with this same name and body appears directly
# before this one; if both live in the same class, this one shadows it.
# Confirm whether the duplicate is intended.
def test_remove_empty_user_reviews(self):
    """
    Checks extractor.remove_empty_user_reviews against the module fixtures:
    the full fixture must reduce to reviews_matrix_non_emtpy, and the fixture
    sliced from index 4 onwards must reduce to an empty list.
    """
    # Full fixture: the result must equal the expected non-empty matrix.
    without_empty = extractor.remove_empty_user_reviews(reviews_matrix_emtpy)
    self.assertEqual(reviews_matrix_non_emtpy, without_empty)

    # Tail of the fixture (index 4 onwards): nothing is expected to remain.
    tail_input = reviews_matrix_emtpy[4:]
    without_empty_tail = extractor.remove_empty_user_reviews(tail_input)
    self.assertEqual([], without_empty_tail)
def clean_reviews(reviews, min_user_reviews=5):
    """
    Filters the reviews list down to the reviews that are useful for
    recommendation purposes, printing progress after each filtering step.

    The steps are, in order: extractor.remove_empty_user_reviews, then
    extractor.remove_users_with_low_reviews.

    :param reviews: a list of reviews
    :param min_user_reviews: threshold forwarded to
        extractor.remove_users_with_low_reviews; defaults to 5, the value
        that was previously hard-coded
    :return: the filtered reviews list, as returned by the last extractor
        step
    """
    filtered_reviews = extractor.remove_empty_user_reviews(reviews)
    # The message names the step that actually ran (it previously named
    # a different function, which was misleading when reading the output).
    print('Finished remove_empty_user_reviews')

    filtered_reviews = extractor.remove_users_with_low_reviews(
        filtered_reviews, min_user_reviews)
    print('Finished remove_users_with_low_reviews')

    # NOTE: item-level filtering (extractor.remove_items_with_low_reviews)
    # and a second, stricter user-level pass are currently not applied.

    print('Number of reviews', len(filtered_reviews))
    return filtered_reviews