예제 #1
0
def prepare_gen_hierarchies_object(dataset, numerical, categorical):
    """Build the generalization hierarchies for the requested attributes.

    Args:
        dataset: Container that supports ``len()`` and integer indexing
            over ``0 .. len(dataset) - 1``; every entry must expose
            ``.get(attribute)``.
        numerical: Iterable of attribute names. Each one gets a
            ``RGH.RangeGenHierarchy`` constructed with the smallest and
            largest value found for it in ``dataset``.
        categorical: Iterable of attribute names. Each one gets a
            ``CGH.CatGenHierarchy`` constructed with the path
            ``config.GENH_DIR + config.GENH_FILE[attribute]``.

    Returns:
        A dict with the keys ``'categorical'`` and ``'range'``, each mapping
        attribute names to the hierarchy object created for them.
    """
    # One categorical hierarchy per attribute, keyed by the attribute name.
    categorical_hierarchies = {
        attribute: CGH.CatGenHierarchy(
            attribute, config.GENH_DIR + config.GENH_FILE[attribute])
        for attribute in categorical
    }

    range_hierarchies = {}
    for attribute in numerical:
        # Entries are fetched by position rather than by iterating the
        # container, so only len() and integer indexing are required of it.
        values = []
        for position in range(len(dataset)):
            values.append(dataset[position].get(attribute))

        lowest = min(values)
        highest = max(values)

        report = ("Found " + str(attribute) + " range of: ["
                  + str(lowest) + ":" + str(highest) + "]")
        print(report)

        range_hierarchies[attribute] = RGH.RangeGenHierarchy(
            attribute, lowest, highest)

    return {'categorical': categorical_hierarchies, 'range': range_hierarchies}
예제 #2
0
 def test_catGenRaceGetGenOfWhite(self):
     # In the 'race' hierarchy, 'White' is expected to generalize to 'all'.
     hierarchy_file = '../data/gen_hierarchies/RaceGH.json'
     race_hierarchy = CGH.CatGenHierarchy('race', hierarchy_file)
     generalized = race_hierarchy.getGeneralizationOf('White')
     self.assertEqual(generalized, 'all')
예제 #3
0
 def test_catGenSexLevels(self):
     # The 'sex' hierarchy is expected to report exactly one level.
     hierarchy_file = '../data/gen_hierarchies/SexGH.json'
     sex_hierarchy = CGH.CatGenHierarchy('sex', hierarchy_file)
     level_count = sex_hierarchy.nrLevels()
     self.assertEqual(level_count, 1)
예제 #4
0
 def test_catGenRaceGetLevelEntryOfWhite(self):
     # In the 'race' hierarchy, 'White' is expected to sit at level 1.
     hierarchy_file = '../data/gen_hierarchies/RaceGH.json'
     race_hierarchy = CGH.CatGenHierarchy('race', hierarchy_file)
     level_of_white = race_hierarchy.getLevelEntry('White')
     self.assertEqual(level_of_white, 1)
예제 #5
0
 def test_catGenRaceGetNrLevels(self):
     # The 'race' hierarchy is expected to report exactly one level.
     hierarchy_file = '../data/gen_hierarchies/RaceGH.json'
     race_hierarchy = CGH.CatGenHierarchy('race', hierarchy_file)
     level_count = race_hierarchy.nrLevels()
     self.assertEqual(level_count, 1)
예제 #6
0
 def test_catGenCountryGetGenOfAsia(self):
     # In the 'native-country' hierarchy, 'Asia' is expected to generalize
     # to 'all'.
     hierarchy_file = '../data/gen_hierarchies/NativeCountryGH.json'
     country_hierarchy = CGH.CatGenHierarchy('native-country', hierarchy_file)
     generalized = country_hierarchy.getGeneralizationOf('Asia')
     self.assertEqual(generalized, 'all')
예제 #7
0
 def test_catGenSexGetGenOfMale(self):
     # In the 'sex' hierarchy, 'Male' is expected to generalize to 'all'.
     hierarchy_file = '../data/gen_hierarchies/SexGH.json'
     sex_hierarchy = CGH.CatGenHierarchy('sex', hierarchy_file)
     generalized = sex_hierarchy.getGeneralizationOf('Male')
     self.assertEqual(generalized, 'all')
예제 #8
0
 def test_catGenCountryLevels(self):
     # The 'native-country' hierarchy is expected to report three levels.
     hierarchy_file = '../data/gen_hierarchies/NativeCountryGH.json'
     country_hierarchy = CGH.CatGenHierarchy('native-country', hierarchy_file)
     level_count = country_hierarchy.nrLevels()
     self.assertEqual(level_count, 3)