예제 #1
0
 def findUnannotatedUpdateIds(self):
     """
     Determine which text updates have not been annotated in any batch yet.

     Lists all update ids under self.textDir, removes the update ids that
     self.getUpdateIds() reports for the batches returned by
     self.findBatchesAtStep("annot"), and stores the remainder as a set in
     self.updateIds. Nothing is returned.
     """
     textUpdateIds = pubStore.listAllUpdateIds(self.textDir)
     batchIds = self.findBatchesAtStep("annot")
     doneUpdateIds = self.getUpdateIds(batchIds)
     # set difference: ids available as text minus ids already processed
     self.updateIds = set(textUpdateIds).difference(doneUpdateIds)
     # hand the values to logging as arguments so the (potentially long)
     # id lists are only rendered when the record is actually emitted
     logging.info("text: %s, done: %s", textUpdateIds, doneUpdateIds)
     logging.info("Text-Updates that have not been annotated yet: %s", self.updateIds)
예제 #2
0
 def findUnannotatedUpdateIds(self):
     """
     Work out which text updates still need to be annotated.

     All update ids found under self.textDir are compared against the
     update ids that self.getUpdateIds() returns for the batches given by
     self.findBatchesAtStep("annot"). The ids that are not in that "done"
     collection are stored as a set in self.updateIds. Nothing is returned.
     """
     textUpdateIds = pubStore.listAllUpdateIds(self.textDir)
     batchIds = self.findBatchesAtStep("annot")
     doneUpdateIds = self.getUpdateIds(batchIds)
     # keep only the ids that do not appear among the finished ones
     self.updateIds = set(textUpdateIds).difference(doneUpdateIds)
     # logging formats lazily when given arguments, so nothing is rendered
     # if the INFO level is disabled
     logging.info("text: %s, done: %s", textUpdateIds, doneUpdateIds)
     logging.info("Text-Updates that have not been annotated yet: %s",
                  self.updateIds)
예제 #3
0
파일: pubMapProp.py 프로젝트: floe/pubMunch
 def updateUpdateIds(self):
     """
     Set self.updateIds to the update ids that have not been processed yet.

     Takes every update id listed under self.textDir and removes those
     returned by self.getAllUpdateIds(); the result is stored as a set in
     self.updateIds. Nothing is returned.
     """
     allUpdateIds = pubStore.listAllUpdateIds(self.textDir)
     doneUpdateIds = self.getAllUpdateIds()
     # set difference: ids present in textDir minus ids already done
     self.updateIds = set(allUpdateIds).difference(doneUpdateIds)
     # pass the set as a logging argument so it is only formatted on emit
     logging.info("Updates that have not been annotated yet: %s", self.updateIds)