Example #1
0
    def process_item(self, item, spider):
        """Store the makers, categories and series carried by ``item``.

        For every entry of ``item['makers']`` two ``BrandInfo`` records are
        saved: the maker itself (``parentid`` 0) and its category (whose
        ``parentid`` is the maker id).  For every entry of ``item['series']``
        one ``BrandInfo`` record is saved with the category id as parent.

        A record whose ``save()`` raises ``IntegrityError`` is logged and
        skipped; processing then continues with the next record, so one
        duplicate never prevents the remaining records from being stored.

        Args:
            item: mapping with a ``'makers'`` iterable (entries providing
                ``makerName``, ``pm``, ``makerId``, ``categoryName`` and
                ``categoryId``) and a ``'series'`` iterable (entries
                providing ``isValid``, ``seriesName``, ``seriesId`` and
                ``categoryId``).
            spider: not used by this method.

        Returns:
            The unchanged ``item``.

        Raises:
            KeyError: if one of the keys listed above is missing.
        """
        import logging

        log = logging.getLogger(__name__)

        def save_brand(code, **fields):
            # Save one BrandInfo row; log and skip it on IntegrityError.
            # Read the clock once so ctime and mtime are exactly equal.
            now = datetime.datetime.now()
            record = BrandInfo(
                ctime=now,
                mtime=now,
                remark='crawl from haoservice',
                brandcode=code,
                **fields
            )
            try:
                record.save()
            except IntegrityError:
                # NOTE(review): presumably this means the brand code is
                # already stored (makers and categories repeat across
                # items) - confirm against the BrandInfo constraints.
                # The item is deliberately not dropped here: doing so
                # would abort the saves that follow.
                log.info("Skipping duplicate brand record: %s", code)

        for maker in item['makers']:
            # Maker: top-level record.
            save_brand(
                maker['makerId'],
                isvalid=1,
                brandname=maker['makerName'],
                pm=maker['pm'],
                parentid=0
            )
            # Category: child of the maker above.
            save_brand(
                maker['categoryId'],
                isvalid=1,
                brandname=maker['categoryName'],
                pm=maker['pm'],
                parentid=maker['makerId']
            )

        for series in item['series']:
            # Series: child of a category; no ``pm`` value is stored for it.
            save_brand(
                series['seriesId'],
                isvalid=series['isValid'],
                brandname=series['seriesName'],
                parentid=series['categoryId']
            )

        return item
Example #2
0
    def process_item(self, item, spider):
        """Store the brand hierarchy of ``item`` and return its car payload.

        Three ``BrandInfo`` records are built from ``item['brandinfo']`` and
        saved in order: the maker (``parentid`` 0), the category (child of
        the maker) and the series (child of the category).

        A record whose ``save()`` raises ``IntegrityError`` is logged and
        skipped; the remaining records are still saved and the car payload
        is still returned.

        Args:
            item: mapping with a ``'brandinfo'`` mapping (providing
                ``makerName``, ``pm``, ``makerId``, ``categoryName``,
                ``categoryId``, ``isValid``, ``seriesName`` and
                ``seriesId``) and a ``'car'`` entry.
            spider: not used by this method.

        Returns:
            ``item['car']``.

        Raises:
            KeyError: if one of the keys listed above is missing.
        """
        import logging

        log = logging.getLogger(__name__)

        brandinfo = item['brandinfo']
        carbase = item['car']

        def save_brand(code, **fields):
            # Save one BrandInfo row; log and skip it on IntegrityError.
            # Read the clock once so ctime and mtime are exactly equal.
            now = datetime.datetime.now()
            record = BrandInfo(
                ctime=now,
                mtime=now,
                remark='crawl from haoservice',
                brandcode=code,
                **fields
            )
            try:
                record.save()
            except IntegrityError:
                # NOTE(review): presumably this means the brand code is
                # already stored (the same maker/category recurs across
                # car items) - confirm against the BrandInfo constraints.
                # The item is deliberately not dropped here: doing so
                # would discard the car payload and skip the later saves.
                log.info("Skipping duplicate brand record: %s", code)

        # Maker: top-level record.
        save_brand(
            brandinfo['makerId'],
            isvalid=1,
            brandname=brandinfo['makerName'],
            pm=brandinfo['pm'],
            parentid=0
        )

        # Category: child of the maker.
        save_brand(
            brandinfo['categoryId'],
            isvalid=1,
            brandname=brandinfo['categoryName'],
            pm=brandinfo['pm'],
            parentid=brandinfo['makerId']
        )

        # Series: child of the category; no ``pm`` value is stored for it.
        save_brand(
            brandinfo['seriesId'],
            isvalid=brandinfo['isValid'],
            brandname=brandinfo['seriesName'],
            parentid=brandinfo['categoryId']
        )

        return carbase