Exemplo n.º 1
0
    def test_months_2_sameTrue(self):
        """Check units='months' with same=True against the fixture date.

        The expected 'Date' values are every day of August 2006 and of
        August 2007, plus 2008-08-01 up to (but excluding)
        ``self.date_string``. 'Year' must be exactly {2006, 2007, 2008} and
        'Month' exactly {8}.
        """
        features, _ = create_X_y(
            df=self.df,
            columns=self.columns,
            target=self.target,
            date=self.date,
            num_units=self.num_units,
            units='months',
            same=True,
        )

        # (start, end) of the expected window in each year; the most recent
        # window runs only up to the fixture date.
        windows = [
            ("2006-08-01", "2006-08-31"),
            ("2007-08-01", "2007-08-31"),
            ("2008-08-01", self.date_string),
        ]
        expected_dates = set()
        for start, end in windows:
            days = pd.date_range(start, end).astype(str).ravel()
            expected_dates.update(days)
        # The fixture date itself must not be part of the features.
        expected_dates.remove(self.date_string)

        self.assertEqual(set(features['Year']), {2006, 2007, 2008})
        self.assertEqual(set(features['Month']), {8})
        self.assertEqual(set(features['Date']), expected_dates)
Exemplo n.º 2
0
    def test_years_2_EdgeCase(self):
        """Check that units='years' from 2002-08-13 yields no feature frame.

        Only the first element returned by ``create_X_y`` is inspected; it
        must be ``None`` for this date.
        """
        # NOTE(review): presumably the fixture data does not reach far enough
        # back from this date -- confirm against setUp.
        edge_date = pd.to_datetime("2002-08-13")

        features, _ = create_X_y(
            df=self.df,
            columns=self.columns,
            target=self.target,
            date=edge_date,
            num_units=self.num_units,
            units='years',
            same=False,
        )

        self.assertIsNone(features)
Exemplo n.º 3
0
    def test_days_2_sameFalse(self):
        """Check units='days' with same=False against the fixture date.

        The 'Date' column of the returned features must contain exactly
        2008-08-11 and 2008-08-12.
        """
        features, _ = create_X_y(
            df=self.df,
            columns=self.columns,
            target=self.target,
            date=self.date,
            num_units=self.num_units,
            units='days',
            same=False,
        )

        observed_dates = set(features['Date'].values)

        self.assertEqual(observed_dates, {"2008-08-12", "2008-08-11"})
Exemplo n.º 4
0
    def test_hours_15(self):
        """Check units='hours' with a look-back of 15 units.

        The 'Hour' column of the returned features must contain exactly the
        hours 9 through 23.
        """
        features, _ = create_X_y(
            df=self.df,
            columns=self.columns,
            target=self.target,
            date=self.date,
            num_units=15,
            units='hours',
            same=False,
        )

        observed_hours = set(features['Hour'].values)

        self.assertEqual(observed_hours, set(range(9, 24)))
Exemplo n.º 5
0
    def test_days_2_sameTrue(self):
        """Check units='days' with same=True against the fixture date.

        The 'Date' column of the returned features must contain exactly
        2006-08-13 and 2007-08-13.
        """
        test_x, _ = create_X_y(df=self.df,
                               columns=self.columns,
                               target=self.target,
                               date=self.date,
                               num_units=self.num_units,
                               units='days',
                               same=True)

        expected_dates = {'2007-08-13', '2006-08-13'}

        self.assertEqual(set(test_x['Date'].values), expected_dates)
Exemplo n.º 6
0
    def test_weeks_2_sameFalse(self):
        """Check units='weeks' with same=False against the fixture date.

        The expected 'Date' values are the 14 consecutive days that end on
        the day before ``self.date``.
        """
        features, _ = create_X_y(
            df=self.df,
            columns=self.columns,
            target=self.target,
            date=self.date,
            num_units=self.num_units,
            units='weeks',
            same=False,
        )

        window_start = self.date - pd.Timedelta("14 days")
        window_days = pd.date_range(window_start, self.date)
        # The range is inclusive of self.date; drop that final entry.
        expected_dates = set(window_days.astype(str).ravel()[:-1])

        observed_dates = set(features['Date'].values)
        self.assertEqual(observed_dates, expected_dates)
Exemplo n.º 7
0
    def test_months_2_sameFalse(self):
        """Check units='months' with same=False against the fixture date.

        The expected 'Date' values are every day from 2008-06-13 through
        2008-08-13, with ``self.date_string`` removed.
        """
        features, _ = create_X_y(
            df=self.df,
            columns=self.columns,
            target=self.target,
            date=self.date,
            num_units=self.num_units,
            units='months',
            same=False,
        )

        window_days = pd.date_range("2008-06-13", "2008-08-13")
        expected_dates = set(window_days.astype(str).ravel())
        # The fixture date itself must not be part of the features.
        expected_dates.remove(self.date_string)

        observed_dates = set(features['Date'].values)
        self.assertEqual(observed_dates, expected_dates)
Exemplo n.º 8
0
    def test_years_2(self):
        """Check units='years' with same=False against the fixture date.

        The expected 'Date' values are every day from ``self.date`` moved
        back ``self.num_units`` calendar years, up to and including the day
        before ``self.date``.
        """
        test_x, _ = create_X_y(df=self.df,
                               columns=self.columns,
                               target=self.target,
                               date=self.date,
                               num_units=self.num_units,
                               units='years',
                               same=False)

        # NOTE(review): replace(year=...) cannot map Feb 29 onto a non-leap
        # year; presumably the fixture date avoids that -- confirm in setUp.
        start_date = self.date.replace(year=self.date.year - self.num_units)
        end_date = self.date + pd.Timedelta("-1 days")

        test_dates = pd.date_range(start_date, end_date).astype(str).ravel()
        test_dates_set = set(test_dates)

        self.assertEqual(set(test_x['Date'].values), test_dates_set)
Exemplo n.º 9
0
    def test_months_2_sameFalse_EdgeCase(self):
        """Check units='months', same=False when the window crosses a year.

        Uses a date of 2013-01-15 with three units; the expected 'Date'
        values are every day from 2012-10-15 through 2013-01-14.
        """
        edge_date = pd.to_datetime("2013-01-15")

        features, _ = create_X_y(
            df=self.df,
            columns=self.columns,
            target=self.target,
            date=edge_date,
            num_units=3,
            units='months',
            same=False,
        )

        window_days = pd.date_range("2012-10-15", "2013-01-14")
        expected_dates = set(window_days.astype(str).ravel())

        observed_dates = set(features['Date'].values)
        self.assertEqual(observed_dates, expected_dates)
Exemplo n.º 10
0
    def test_weeks_2_sameTrue(self):
        """Check units='weeks' with same=True against the fixture date.

        The expected 'Date' values are 08-10 through 08-16 of 2006 and of
        2007, plus 2008-08-10 through 2008-08-12.
        """
        features, _ = create_X_y(
            df=self.df,
            columns=self.columns,
            target=self.target,
            date=self.date,
            num_units=self.num_units,
            units='weeks',
            same=True,
        )

        # One (start, end) window per year; the latest one is shorter.
        windows = (
            ("2006-08-10", "2006-08-16"),
            ("2007-08-10", "2007-08-16"),
            ("2008-08-10", "2008-08-12"),
        )
        per_year = [pd.date_range(start, end).astype(str).ravel()
                    for start, end in windows]
        expected_dates = set(np.hstack(per_year))

        observed_dates = set(features['Date'].values)
        self.assertEqual(observed_dates, expected_dates)
Exemplo n.º 11
0
    def test_weeks_2_sameTrue_EdgeCase2(self):
        """Check units='weeks', same=True when windows straddle New Year.

        Uses a date of 2009-12-31; the expected 'Date' values are
        2007-12-28 through 2008-01-03, 2008-12-28 through 2009-01-03, and
        2009-12-28 through 2009-12-30.
        """
        edge_date = pd.to_datetime("2009-12-31")

        features, _ = create_X_y(
            df=self.df,
            columns=self.columns,
            target=self.target,
            date=edge_date,
            num_units=self.num_units,
            units='weeks',
            same=True,
        )

        # The two earlier windows cross the year boundary; the latest one
        # stops on 2009-12-30.
        windows = (
            ("2007-12-28", "2008-01-03"),
            ("2008-12-28", "2009-01-03"),
            ("2009-12-28", "2009-12-30"),
        )
        per_window = [pd.date_range(start, end).astype(str).ravel()
                      for start, end in windows]
        expected_dates = set(np.hstack(per_window))

        observed_dates = set(features['Date'].values)
        self.assertEqual(observed_dates, expected_dates)