def testFindDataRegions(self):
     """Check PartialTreeAlignment.findDataRegions on selected XML fixtures.

     Each case pairs an index into ``self.xmlcode`` with the expected result,
     written as a list of ``(tag, region)`` tuples: ``tag`` is compared with
     the ``.tag`` of the first item of every returned entry, ``region`` with
     the second item of that entry.
     """
     from IntelligentCrawl.config import Configuration

     cases = [(0, []),
              (3, []),
              (4, [('sky', [2, 0, 4])]),
              (5, [])]

     # The override is written to the shared Configuration object, so it
     # would leak into every test that runs afterwards. Remember the previous
     # state (including "attribute absent") and put it back when done.
     # NOTE(review): "MinDataRegiontHeight" looks like a typo for
     # "MinDataRegionHeight"; if the config really uses the latter, this
     # assignment has no effect on the code under test -- confirm against
     # IntelligentCrawl.config before renaming.
     missing = object()
     previous = getattr(Configuration, 'MinDataRegiontHeight', missing)
     Configuration.MinDataRegiontHeight = 3
     try:
         for tid, truevalue in cases:
             apple = etree.fromstring(self.xmlcode[tid])
             # Called before the region search and its return value is
             # unused; presumably it annotates the tree in place -- TODO
             # confirm.
             BasicFeatureExtraction.extractBasicStats(apple)
             print(etree.tostring(apple))
             res = PartialTreeAlignment.findDataRegions(apple, 2, 0.3)
             print(res)

             tags = [e[0].tag for e in res]
             drs = [e[1] for e in res]
             truetags = [e[0] for e in truevalue]
             truedrs = [e[1] for e in truevalue]

             # Name the fixture in the failure message so a failing case can
             # be identified without reading the printed output.
             label = 'xmlcode[%d]' % tid
             self.assertListEqual(tags, truetags, label)
             self.assertListEqual(drs, truedrs, label)
     finally:
         if previous is missing:
             del Configuration.MinDataRegiontHeight
         else:
             Configuration.MinDataRegiontHeight = previous