def test_get_listens_to_fetch_top_artists(self):
    """get_listens_to_fetch_top_artists returns three rows for the fixture listens.

    The date bounds passed to it come from
    get_dates_to_generate_candidate_sets, called with the fixture listens
    and ``self.recommendation_generation_window``.
    """
    listens_df = self.get_listens()
    window_start, window_end = candidate_sets.get_dates_to_generate_candidate_sets(
        listens_df,
        self.recommendation_generation_window,
    )

    listens_in_window = candidate_sets.get_listens_to_fetch_top_artists(
        listens_df,
        window_start,
        window_end,
    )

    row_count = listens_in_window.count()
    self.assertEqual(row_count, 3)
def test_get_dates_to_generate_candidate_sets(self):
    """get_dates_to_generate_candidate_sets returns the expected date pair.

    Uses the mapped listens stored at RECOMMENDATION_RECORDING_MAPPED_LISTENS
    and a second argument of 7.
    """
    listens_df = utils.read_files_from_HDFS(RECOMMENDATION_RECORDING_MAPPED_LISTENS)

    date_bounds = candidate_sets.get_dates_to_generate_candidate_sets(listens_df, 7)
    window_start, window_end = date_bounds

    # Upper bound is checked first, then the lower bound.
    self.assertEqual(window_end, datetime(2021, 8, 9, 10, 20, 11))
    self.assertEqual(window_start, datetime(2021, 8, 2))
def test_get_dates_to_generate_candidate_sets(self):
    """get_dates_to_generate_candidate_sets returns the expected date pair.

    ``to_date`` must equal ``self.date``. ``from_date`` must equal
    ``stats.offset_days(self.date, window)`` with hour, minute and second
    reset to zero.
    """
    listens_df = self.get_listens()
    window_start, window_end = candidate_sets.get_dates_to_generate_candidate_sets(
        listens_df,
        self.recommendation_generation_window,
    )

    self.assertEqual(window_end, self.date)

    shifted = stats.offset_days(self.date, self.recommendation_generation_window)
    # Only hour/minute/second are zeroed, exactly as the expected value requires.
    expected_start = shifted.replace(hour=0, minute=0, second=0)
    self.assertEqual(window_start, expected_start)
def test_get_listens_to_fetch_top_artists(self):
    """get_listens_to_fetch_top_artists output matches the stored expectation.

    The result is compared, ignoring row order, against
    ``self.mapped_listens_subset`` and must contain 11 rows.
    """
    # Show complete diffs on failure instead of truncating them.
    self.maxDiff = None

    listens_df = utils.read_files_from_HDFS(RECOMMENDATION_RECORDING_MAPPED_LISTENS)
    window_start, window_end = candidate_sets.get_dates_to_generate_candidate_sets(
        listens_df,
        7,
    )
    listens_in_window = candidate_sets.get_listens_to_fetch_top_artists(
        listens_df,
        window_start,
        window_end,
    )

    actual_rows = list(listens_in_window.toLocalIterator())
    expected_rows = list(self.mapped_listens_subset.toLocalIterator())
    self.assertCountEqual(actual_rows, expected_rows)

    self.assertEqual(listens_in_window.count(), 11)