Пример #1
0
 def _parseEntity(self, row, count):
     """Convert one row of the iPhone apps table into an Entity and emit it.

     A new Entity is created with subcategory "app" and tagged with the
     source table name. Every (source key, destination key) pair in
     self._map is then applied: when the row has a non-empty value under
     the source key, that value is stored on the entity under the
     destination key. The finished entity is handed to self._output.put().

     row   -- mapping-like record supporting `in` and item access.
     count -- index of the row; not used by this method.
     """
     app = Entity()
     app.subcategory = "app"
     app.factual = {'table': 'iPhone_Apps.csv'}

     for column, field in self._map.iteritems():
         # Columns missing from this row are skipped.
         if column not in row:
             continue

         value = row[column]
         # Only copy values that are both truthy and non-empty.
         if value and len(value) > 0:
             app[field] = value

     self._output.put(app)
Пример #2
0
    def _parseEntity(self, row, count):
        """Convert one row of the US restaurants table into an Entity and emit it.

        The row's name is lower-cased and stripped, then looked up in the
        module-level `to_collapse` mapping:

        * name not present -- the entity is emitted normally, with an
          address if FactualUtils.parseAddress(row) returns one;
        * name present, flag falsy -- this is the first occurrence: the flag
          is set to True and the entity is emitted without an address;
        * name present, flag truthy -- the row is dropped and
          self.numCollapsed is incremented.

        Every (source key, destination key) pair in self._map whose source
        key has a truthy value in the row is copied onto the entity, which
        is finally handed to self._output.put().

        row   -- mapping-like record; must contain a "name" entry.
        count -- index of the row; not used by this method.
        """
        key = row["name"].lower().strip()

        is_collapsed = key in to_collapse
        if is_collapsed:
            if to_collapse[key]:
                # Already emitted once for this name; just count the duplicate.
                self.numCollapsed += 1
                return

            # First sighting of a collapsible name: remember that it was emitted.
            to_collapse[key] = True

        restaurant = Entity()
        restaurant.subcategory = "restaurant"
        restaurant.factual = {"table": "US_Restaurants_V2.csv"}

        # A collapsed entity does not get an address from this row.
        if not is_collapsed:
            parsed = FactualUtils.parseAddress(row)
            if parsed is not None:
                restaurant.address = parsed

        for column, field in self._map.iteritems():
            if column not in row:
                continue

            value = row[column]
            if value:
                restaurant[field] = value

        self._output.put(restaurant)