Esempio n. 1
0
 def test_columns_heterogeneous_aggregate(self):
     columns = Columns(self.column_data, kdims=self.kdims,
                       vdims=self.vdims)
     aggregated = Columns(pd.DataFrame([('F', 10., 0.8), ('M', 16.5, 0.7)],
                                       columns=['Gender']+self.vdims),
                          kdims=self.kdims[:1], vdims=self.vdims)
     self.compare_columns(columns.aggregate(['Gender'], np.mean), aggregated)
Esempio n. 2
0
 def test_columns_2D_aggregate_partial_hm(self):
     array = np.random.rand(11, 11)
     columns = Columns({'x':self.xs, 'y':self.y_ints, 'z': array},
                       kdims=['x', 'y'], vdims=['z'])
     self.assertEqual(columns.aggregate(['x'], np.mean),
                      Columns({'x':self.xs, 'z': np.mean(array, axis=1)},
                              kdims=['x'], vdims=['z']))
Esempio n. 3
0
 def test_columns_2D_aggregate_partial_ht(self):
     columns = Columns({
         'x': self.xs,
         'y': self.ys,
         'z': self.zs
     },
                       kdims=['x', 'y'],
                       vdims=['z'])
     reduced = Columns({
         'x': self.xs,
         'z': self.zs
     },
                       kdims=['x'],
                       vdims=['z'])
     self.assertEqual(columns.aggregate(['x'], np.mean), reduced)
Esempio n. 4
0
 def test_columns_2D_aggregate_partial_hm(self):
     z_ints = [el**2 for el in self.y_ints]
     columns = Columns({
         'x': self.xs,
         'y': self.y_ints,
         'z': z_ints
     },
                       kdims=['x', 'y'],
                       vdims=['z'])
     self.assertEqual(
         columns.aggregate(['x'], np.mean),
         Columns({
             'x': self.xs,
             'z': z_ints
         }, kdims=['x'], vdims=['z']))
Esempio n. 5
0
 def test_columns_2d_partial_reduce(self):
     columns = Columns(pd.DataFrame({'x': self.xs, 'y': self.ys, 'z': self.zs}),
                       kdims=['x', 'y'], vdims=['z'])
     self.assertEqual(columns.aggregate(['x'], np.mean),
                      Columns(pd.DataFrame({'x': self.xs, 'z': self.zs}),
                              kdims=['x'], vdims=['z']))
Esempio n. 6
0
 def test_columns_2d_aggregate_partial(self):
     columns = Columns((self.xs, self.ys, self.zs), kdims=['x', 'y'], vdims=['z'])
     self.assertEqual(columns.aggregate(['x'], np.mean),
                      Columns((self.xs, self.zs), kdims=['x'], vdims=['z']))
Esempio n. 7
0
 def test_column_heterogeneous_aggregate(self):
     columns = Columns(zip(self.keys1, self.values1), kdims=self.kdims,
                       vdims=self.vdims)
     aggregated = Columns(OrderedDict([('M', (16.5, 0.7)), ('F', (10., 0.8))]),
                          kdims=self.kdims[:1], vdims=self.vdims)
     self.compare_columns(columns.aggregate(['Gender'], np.mean), aggregated)
Esempio n. 8
0
 def test_columns_2D_aggregate_partial_ht(self):
     columns = Columns({'x':self.xs, 'y':self.ys, 'z':self.zs},
                       kdims=['x', 'y'], vdims=['z'])
     reduced = Columns({'x':self.xs, 'z':self.zs},
                       kdims=['x'], vdims=['z'])
     self.assertEqual(columns.aggregate(['x'], np.mean), reduced)
Esempio n. 9
0
class HeterogeneousColumnTypes(HomogeneousColumnTypes):
    """
    Tests for data formats that all columns to have varied types
    """

    def init_data(self):
        self.kdims = ['Gender', 'Age']
        self.vdims = ['Weight', 'Height']
        self.gender, self.age = ['M','M','F'], [10,16,12]
        self.weight, self.height = [15,18,10], [0.8,0.6,0.8]
        self.table = Columns({'Gender':self.gender, 'Age':self.age,
                              'Weight':self.weight, 'Height':self.height},
                             kdims=self.kdims, vdims=self.vdims)

        super(HeterogeneousColumnTypes, self).init_data()
        self.ys = np.linspace(0, 1, 11)
        self.zs = np.sin(self.xs)
        self.columns_ht = Columns({'x':self.xs, 'y':self.ys},
                                  kdims=['x'], vdims=['y'])

    # Test the constructor to be supported by all interfaces supporting
    # heterogeneous column types.

    def test_columns_ndelement_init_ht(self):
        "Tests support for heterogeneous NdElement (backwards compatibility)"
        columns = Columns(NdElement(zip(self.xs, self.ys), kdims=['x'], vdims=['y']))
        self.assertTrue(isinstance(columns.data, self.data_instance_type))

    def test_columns_dataframe_init_ht(self):
        "Tests support for heterogeneous DataFrames"
        if pd is None:
            raise SkipTest("Pandas not available")
        columns = Columns(pd.DataFrame({'x':self.xs, 'y':self.ys}), kdims=['x'], vdims=['y'])
        self.assertTrue(isinstance(columns.data, self.data_instance_type))

    # Test literal formats

    def test_columns_uniq_dimvals_ht(self):
        self.assertEqual(self.table.dimension_values('Gender', unique=True),
                         np.array(['M', 'F']))

    def test_columns_implicit_indexing_init(self):
        columns = Columns(self.ys, kdims=['x'], vdims=['y'])
        self.assertTrue(isinstance(columns.data, self.data_instance_type))

    def test_columns_tuple_init(self):
        columns = Columns((self.xs, self.ys), kdims=['x'], vdims=['y'])
        self.assertTrue(isinstance(columns.data, self.data_instance_type))

    def test_columns_simple_zip_init(self):
        columns = Columns(zip(self.xs, self.ys), kdims=['x'], vdims=['y'])
        self.assertTrue(isinstance(columns.data, self.data_instance_type))

    def test_columns_zip_init(self):
        columns = Columns(zip(self.gender, self.age,
                              self.weight, self.height),
                          kdims=self.kdims, vdims=self.vdims)
        self.assertTrue(isinstance(columns.data, self.data_instance_type))

    def test_columns_odict_init(self):
        columns = Columns(OrderedDict(zip(self.xs, self.ys)), kdims=['A'], vdims=['B'])
        self.assertTrue(isinstance(columns.data, self.data_instance_type))

    def test_columns_dict_init(self):
        columns = Columns(dict(zip(self.xs, self.ys)), kdims=['A'], vdims=['B'])
        self.assertTrue(isinstance(columns.data, self.data_instance_type))

    # Operations

    def test_columns_sort_vdim_ht(self):
        columns = Columns({'x':self.xs, 'y':-self.ys},
                          kdims=['x'], vdims=['y'])
        columns_sorted = Columns({'x':self.xs[::-1], 'y':-self.ys[::-1]},
                                 kdims=['x'], vdims=['y'])
        self.assertEqual(columns.sort('y'), columns_sorted)

    def test_columns_sort_string_ht(self):
        columns_sorted = Columns({'Gender':['F','M','M'], 'Age':[12,10,16],
                                  'Weight':[10,15,18], 'Height':[0.8,0.8,0.6]},
                                 kdims=self.kdims, vdims=self.vdims)
        self.assertEqual(self.table.sort(), columns_sorted)

    def test_columns_sample_ht(self):
        samples = self.columns_ht.sample([0, 5, 10]).dimension_values('y')
        self.assertEqual(samples, np.array([0, 0.5, 1]))

    def test_columns_reduce_ht(self):
        reduced = Columns({'Age':self.age, 'Weight':self.weight, 'Height':self.height},
                          kdims=self.kdims[1:], vdims=self.vdims)
        self.assertEqual(self.table.reduce(['Gender'], np.mean), reduced)

    def test_columns_1D_reduce_ht(self):
        self.assertEqual(self.columns_ht.reduce('x', np.mean), np.float64(0.5))

    def test_columns_2D_reduce_ht(self):
        reduced = Columns({'Weight':[14.333333333333334], 'Height':[0.73333333333333339]},
                          kdims=[], vdims=self.vdims)
        self.assertEqual(self.table.reduce(function=np.mean), reduced)

    def test_columns_2D_partial_reduce_ht(self):
        columns = Columns({'x':self.xs, 'y':self.ys, 'z':self.zs},
                          kdims=['x', 'y'], vdims=['z'])
        reduced = Columns({'x':self.xs, 'z':self.zs},
                          kdims=['x'], vdims=['z'])
        self.assertEqual(columns.reduce(['y'], np.mean), reduced)

    def test_column_aggregate_ht(self):
        aggregated = Columns({'Gender':['M','F'], 'Weight':[16.5,10], 'Height':[0.7,0.8]},
                             kdims=self.kdims[:1], vdims=self.vdims)
        self.compare_columns(self.table.aggregate(['Gender'], np.mean), aggregated)

    def test_columns_2D_aggregate_partial_ht(self):
        columns = Columns({'x':self.xs, 'y':self.ys, 'z':self.zs},
                          kdims=['x', 'y'], vdims=['z'])
        reduced = Columns({'x':self.xs, 'z':self.zs},
                          kdims=['x'], vdims=['z'])
        self.assertEqual(columns.aggregate(['x'], np.mean), reduced)


    def test_columns_groupby(self):
        group1 = {'Age':[10,16], 'Weight':[15,18], 'Height':[0.8,0.6]}
        group2 = {'Age':[12], 'Weight':[10], 'Height':[0.8]}
        with sorted_context(False):
            grouped = HoloMap([('M', Columns(group1, kdims=['Age'], vdims=self.vdims)),
                               ('F', Columns(group2, kdims=['Age'], vdims=self.vdims))],
                              kdims=['Gender'])
        self.assertEqual(self.table.groupby(['Gender']), grouped)


    def test_columns_add_dimensions_value_ht(self):
        table = self.columns_ht.add_dimension('z', 1, 0)
        self.assertEqual(table.kdims[1], 'z')
        self.compare_arrays(table.dimension_values('z'), np.zeros(len(table)))

    def test_columns_add_dimensions_values_ht(self):
        table = self.columns_ht.add_dimension('z', 1, range(1,12))
        self.assertEqual(table.kdims[1], 'z')
        self.compare_arrays(table.dimension_values('z'), np.array(list(range(1,12))))

    # Indexing

    def test_columns_index_row_gender_female(self):
        indexed = Columns({'Gender':['F'],'Age':[12],
                           'Weight':[10], 'Height':[0.8]},
                          kdims=self.kdims, vdims=self.vdims)
        row = self.table['F',:]
        self.assertEquals(row, indexed)

    def test_columns_index_rows_gender_male(self):
        row = self.table['M',:]
        indexed = Columns({'Gender':['M','M'],'Age':[10,16],
                           'Weight':[15,18], 'Height':[0.8,0.6]},
                          kdims=self.kdims, vdims=self.vdims)
        self.assertEquals(row, indexed)

    def test_columns_index_row_age(self):
        indexed = Columns({'Gender':['F'],'Age':[12],
                           'Weight':[10], 'Height':[0.8]},
                          kdims=self.kdims, vdims=self.vdims)
        self.assertEquals(self.table[:, 12], indexed)

    def test_columns_index_item_table(self):
        indexed = Columns({'Gender':['F'],'Age':[12],
                           'Weight':[10], 'Height':[0.8]},
                          kdims=self.kdims, vdims=self.vdims)
        self.assertEquals(self.table['F', 12], indexed)

    def test_columns_index_value1(self):
        self.assertEquals(self.table['F', 12, 'Weight'], 10)

    def test_columns_index_value2(self):
        self.assertEquals(self.table['F', 12, 'Height'], 0.8)

    def test_columns_index_column_ht(self):
        self.compare_arrays(self.columns_ht['y'], self.ys)

    def test_columns_boolean_index(self):
        row = self.table[np.array([True, True, False])]
        indexed = Columns({'Gender':['M','M'],'Age':[10,16],
                           'Weight':[15,18], 'Height':[0.8,0.6]},
                          kdims=self.kdims, vdims=self.vdims)
        self.assertEquals(row, indexed)

    def test_columns_value_dim_index(self):
        row = self.table[:, :, 'Weight']
        indexed = Columns({'Gender':['M','M','F'],'Age':[10,16, 12],
                           'Weight':[15,18, 10]},
                          kdims=self.kdims, vdims=self.vdims[:1])
        self.assertEquals(row, indexed)

    def test_columns_value_dim_scalar_index(self):
        row = self.table['M', 10, 'Weight']
        self.assertEquals(row, 15)

    # Casting

    def test_columns_array_ht(self):
        self.assertEqual(self.columns_ht.array(),
                         np.column_stack([self.xs, self.ys]))
Esempio n. 10
0
 def test_columns_2D_aggregate_partial_hm(self):
     z_ints = [el**2 for el in self.y_ints]
     columns = Columns({'x':self.xs, 'y':self.y_ints, 'z':z_ints},
                       kdims=['x', 'y'], vdims=['z'])
     self.assertEqual(columns.aggregate(['x'], np.mean),
                      Columns({'x':self.xs, 'z':z_ints}, kdims=['x'], vdims=['z']))
Esempio n. 11
0
class HeterogeneousColumnTypes(HomogeneousColumnTypes):
    """
    Tests for data formats that all columns to have varied types
    """
    def init_data(self):
        self.kdims = ['Gender', 'Age']
        self.vdims = ['Weight', 'Height']
        self.gender, self.age = ['M', 'M', 'F'], [10, 16, 12]
        self.weight, self.height = [15, 18, 10], [0.8, 0.6, 0.8]
        self.table = Columns(
            {
                'Gender': self.gender,
                'Age': self.age,
                'Weight': self.weight,
                'Height': self.height
            },
            kdims=self.kdims,
            vdims=self.vdims)

        super(HeterogeneousColumnTypes, self).init_data()
        self.ys = np.linspace(0, 1, 11)
        self.zs = np.sin(self.xs)
        self.columns_ht = Columns({
            'x': self.xs,
            'y': self.ys
        },
                                  kdims=['x'],
                                  vdims=['y'])

    # Test the constructor to be supported by all interfaces supporting
    # heterogeneous column types.

    def test_columns_ndelement_init_ht(self):
        "Tests support for heterogeneous NdElement (backwards compatibility)"
        columns = Columns(
            NdElement(zip(self.xs, self.ys), kdims=['x'], vdims=['y']))
        self.assertTrue(isinstance(columns.data, self.data_instance_type))

    def test_columns_dataframe_init_ht(self):
        "Tests support for heterogeneous DataFrames"
        if pd is None:
            raise SkipTest("Pandas not available")
        columns = Columns(pd.DataFrame({
            'x': self.xs,
            'y': self.ys
        }),
                          kdims=['x'],
                          vdims=['y'])
        self.assertTrue(isinstance(columns.data, self.data_instance_type))

    # Test literal formats

    def test_columns_implicit_indexing_init(self):
        columns = Columns(self.ys, kdims=['x'], vdims=['y'])
        self.assertTrue(isinstance(columns.data, self.data_instance_type))

    def test_columns_tuple_init(self):
        columns = Columns((self.xs, self.ys), kdims=['x'], vdims=['y'])
        self.assertTrue(isinstance(columns.data, self.data_instance_type))

    def test_columns_simple_zip_init(self):
        columns = Columns(zip(self.xs, self.ys), kdims=['x'], vdims=['y'])
        self.assertTrue(isinstance(columns.data, self.data_instance_type))

    def test_columns_zip_init(self):
        columns = Columns(zip(self.gender, self.age, self.weight, self.height),
                          kdims=self.kdims,
                          vdims=self.vdims)
        self.assertTrue(isinstance(columns.data, self.data_instance_type))

    def test_columns_odict_init(self):
        columns = Columns(OrderedDict(zip(self.xs, self.ys)),
                          kdims=['A'],
                          vdims=['B'])
        self.assertTrue(isinstance(columns.data, self.data_instance_type))

    def test_columns_dict_init(self):
        columns = Columns(dict(zip(self.xs, self.ys)),
                          kdims=['A'],
                          vdims=['B'])
        self.assertTrue(isinstance(columns.data, self.data_instance_type))

    # Operations

    def test_columns_sort_vdim_ht(self):
        columns = Columns({
            'x': self.xs,
            'y': -self.ys
        },
                          kdims=['x'],
                          vdims=['y'])
        columns_sorted = Columns({
            'x': self.xs[::-1],
            'y': -self.ys[::-1]
        },
                                 kdims=['x'],
                                 vdims=['y'])
        self.assertEqual(columns.sort('y'), columns_sorted)

    def test_columns_sort_string_ht(self):
        columns_sorted = Columns(
            {
                'Gender': ['F', 'M', 'M'],
                'Age': [12, 10, 16],
                'Weight': [10, 15, 18],
                'Height': [0.8, 0.8, 0.6]
            },
            kdims=self.kdims,
            vdims=self.vdims)
        self.assertEqual(self.table.sort(), columns_sorted)

    def test_columns_sample_ht(self):
        samples = self.columns_ht.sample([0, 5, 10]).dimension_values('y')
        self.assertEqual(samples, np.array([0, 0.5, 1]))

    def test_columns_reduce_ht(self):
        reduced = Columns(
            {
                'Age': self.age,
                'Weight': self.weight,
                'Height': self.height
            },
            kdims=self.kdims[1:],
            vdims=self.vdims)
        self.assertEqual(self.table.reduce(['Gender'], np.mean), reduced)

    def test_columns_1D_reduce_ht(self):
        self.assertEqual(self.columns_ht.reduce('x', np.mean), np.float64(0.5))

    def test_columns_2D_reduce_ht(self):
        reduced = Columns(
            {
                'Weight': [14.333333333333334],
                'Height': [0.73333333333333339]
            },
            kdims=[],
            vdims=self.vdims)
        self.assertEqual(self.table.reduce(function=np.mean), reduced)

    def test_columns_2D_partial_reduce_ht(self):
        columns = Columns({
            'x': self.xs,
            'y': self.ys,
            'z': self.zs
        },
                          kdims=['x', 'y'],
                          vdims=['z'])
        reduced = Columns({
            'x': self.xs,
            'z': self.zs
        },
                          kdims=['x'],
                          vdims=['z'])
        self.assertEqual(columns.reduce(['y'], np.mean), reduced)

    def test_column_aggregate_ht(self):
        aggregated = Columns(
            {
                'Gender': ['M', 'F'],
                'Weight': [16.5, 10],
                'Height': [0.7, 0.8]
            },
            kdims=self.kdims[:1],
            vdims=self.vdims)
        self.compare_columns(self.table.aggregate(['Gender'], np.mean),
                             aggregated)

    def test_columns_2D_aggregate_partial_ht(self):
        columns = Columns({
            'x': self.xs,
            'y': self.ys,
            'z': self.zs
        },
                          kdims=['x', 'y'],
                          vdims=['z'])
        reduced = Columns({
            'x': self.xs,
            'z': self.zs
        },
                          kdims=['x'],
                          vdims=['z'])
        self.assertEqual(columns.aggregate(['x'], np.mean), reduced)

    def test_columns_groupby(self):
        group1 = {'Age': [10, 16], 'Weight': [15, 18], 'Height': [0.8, 0.6]}
        group2 = {'Age': [12], 'Weight': [10], 'Height': [0.8]}
        with sorted_context(False):
            grouped = HoloMap(
                [('M', Columns(group1, kdims=['Age'], vdims=self.vdims)),
                 ('F', Columns(group2, kdims=['Age'], vdims=self.vdims))],
                kdims=['Gender'])
        self.assertEqual(self.table.groupby(['Gender']), grouped)

    def test_columns_add_dimensions_value_ht(self):
        table = self.columns_ht.add_dimension('z', 1, 0)
        self.assertEqual(table.kdims[1], 'z')
        self.compare_arrays(table.dimension_values('z'), np.zeros(len(table)))

    def test_columns_add_dimensions_values_ht(self):
        table = self.columns_ht.add_dimension('z', 1, range(1, 12))
        self.assertEqual(table.kdims[1], 'z')
        self.compare_arrays(table.dimension_values('z'),
                            np.array(list(range(1, 12))))

    # Indexing

    def test_columns_index_row_gender_female(self):
        indexed = Columns(
            {
                'Gender': ['F'],
                'Age': [12],
                'Weight': [10],
                'Height': [0.8]
            },
            kdims=self.kdims,
            vdims=self.vdims)
        row = self.table['F', :]
        self.assertEquals(row, indexed)

    def test_columns_index_rows_gender_male(self):
        row = self.table['M', :]
        indexed = Columns(
            {
                'Gender': ['M', 'M'],
                'Age': [10, 16],
                'Weight': [15, 18],
                'Height': [0.8, 0.6]
            },
            kdims=self.kdims,
            vdims=self.vdims)
        self.assertEquals(row, indexed)

    def test_columns_index_row_age(self):
        indexed = Columns(
            {
                'Gender': ['F'],
                'Age': [12],
                'Weight': [10],
                'Height': [0.8]
            },
            kdims=self.kdims,
            vdims=self.vdims)
        self.assertEquals(self.table[:, 12], indexed)

    def test_columns_index_item_table(self):
        indexed = Columns(
            {
                'Gender': ['F'],
                'Age': [12],
                'Weight': [10],
                'Height': [0.8]
            },
            kdims=self.kdims,
            vdims=self.vdims)
        self.assertEquals(self.table['F', 12], indexed)

    def test_columns_index_value1(self):
        self.assertEquals(self.table['F', 12, 'Weight'], 10)

    def test_columns_index_value2(self):
        self.assertEquals(self.table['F', 12, 'Height'], 0.8)

    def test_columns_index_column_ht(self):
        self.compare_arrays(self.columns_ht['y'], self.ys)

    def test_columns_boolean_index(self):
        row = self.table[np.array([True, True, False])]
        indexed = Columns(
            {
                'Gender': ['M', 'M'],
                'Age': [10, 16],
                'Weight': [15, 18],
                'Height': [0.8, 0.6]
            },
            kdims=self.kdims,
            vdims=self.vdims)
        self.assertEquals(row, indexed)

    def test_columns_value_dim_index(self):
        row = self.table[:, :, 'Weight']
        indexed = Columns(
            {
                'Gender': ['M', 'M', 'F'],
                'Age': [10, 16, 12],
                'Weight': [15, 18, 10]
            },
            kdims=self.kdims,
            vdims=self.vdims[:1])
        self.assertEquals(row, indexed)

    def test_columns_value_dim_scalar_index(self):
        row = self.table['M', 10, 'Weight']
        self.assertEquals(row, 15)

    # Casting

    def test_columns_array_ht(self):
        self.assertEqual(self.columns_ht.array(),
                         np.column_stack([self.xs, self.ys]))