예제 #1
0
class SupportIdentifierTestCase(unittest.TestCase):
    """Measure how often SupportIdentifier selects a table's subject column.

    Fixtures are obtained from T2DSampler. The test reports an accuracy
    figure on stdout; it does not enforce a minimum score.
    """

    def setUp(self):
        """Create the sampler-backed tables and the identifier under test."""
        sampler = T2DSampler()
        self.testTable = sampler.getTestTable()
        self.scIdentifier = SupportIdentifier()
        self.testTables = sampler.getTablesSubjectIdentificationGoldStandard()

    def testSupportIdentifier(self):
        """Print the hit count, table count and macro accuracy.

        A table counts as a hit when ``table.isSubjectColumn`` accepts the
        column returned by ``identifySubjectColumn``.

        Previously recorded results (presumably "floor ceil | macro
        accuracy"; the last row matches the values used below -- confirm):

           support = 0 100 | 0.327868852459
           support = 0.8 97 | 0.327868852459
           support = 0.8 30 | 0.459016393443
           support = 0.8 40 | 0.409836065574
           support = 10 70 | 0.475409836066
        """
        # The support bounds are the same for every table, so set them once.
        supportFloor = 10
        supportCeil = 70

        tableCount = len(self.testTables)
        # Fail with a readable message instead of a ZeroDivisionError below.
        self.assertTrue(
            tableCount > 0,
            "gold standard sample is empty; macro accuracy is undefined",
        )

        correctly = 0
        for table in self.testTables:
            # NOTE(review): the ceiling is passed before the floor; confirm
            # this matches the identifySubjectColumn signature.
            subjectColumn = self.scIdentifier.identifySubjectColumn(
                table, supportCeil, supportFloor
            )
            if table.isSubjectColumn(subjectColumn):
                correctly += 1

        macroAccuracy = float(correctly) / tableCount
        # Single-argument print(...) emits the same text on Python 2 and 3.
        print(correctly)
        print(tableCount)
        print(macroAccuracy)