def process_item(self, item, spider):
    """Store the maker, category and series rows carried by ``item``.

    Every entry of ``item['makers']`` produces two ``BrandInfo`` rows: the
    maker itself (``parentid`` 0) and its category (``parentid`` set to the
    maker id).  Every entry of ``item['series']`` produces one row whose
    ``parentid`` is the series' category id.

    A row whose ``save()`` raises ``IntegrityError`` is logged and skipped;
    the remaining rows are still written.

    Args:
        item: mapping with a ``'makers'`` and a ``'series'`` iterable of
            mappings (keys as read below).
        spider: the spider that produced ``item``; not used here.

    Returns:
        ``item`` itself, unchanged, so later pipeline stages can use it.
    """
    # Function-scope import keeps this block self-contained.
    import logging

    log = logging.getLogger(__name__)

    def store(code, **fields):
        # A single timestamp per row keeps ctime and mtime identical on
        # creation instead of differing by a few microseconds.
        now = datetime.datetime.now()
        row = BrandInfo(
            ctime=now,
            mtime=now,
            remark='crawl from haoservice',
            brandcode=code,
            **fields
        )
        try:
            row.save()
        except IntegrityError as exc:
            # The original built a DropItem here without raising it, which
            # silently swallowed the error.  Raising would abort the rows
            # that follow (the same maker can be listed once per category),
            # so record the skip and carry on.
            # NOTE(review): presumably the violated constraint is a unique
            # brandcode -- confirm against the BrandInfo schema.
            log.info("Skipping brand code %s (integrity error): %s", code, exc)

    for maker in item['makers']:
        # maker
        store(
            maker['makerId'],
            isvalid=1,
            brandname=maker['makerName'],
            pm=maker['pm'],
            parentid=0,
        )
        # category, attached to its maker
        store(
            maker['categoryId'],
            isvalid=1,
            brandname=maker['categoryName'],
            pm=maker['pm'],
            parentid=maker['makerId'],
        )

    for series in item['series']:
        # series; no ``pm`` is passed, so BrandInfo's own default applies
        store(
            series['seriesId'],
            isvalid=series['isValid'],
            brandname=series['seriesName'],
            parentid=series['categoryId'],
        )

    return item
def process_item(self, item, spider):
    """Store the maker/category/series chain of one car and pass the car on.

    ``item['brandinfo']`` describes a single maker -> category -> series
    chain.  Three ``BrandInfo`` rows are written for it: the maker
    (``parentid`` 0), the category (``parentid`` set to the maker id) and
    the series (``parentid`` set to the category id).

    A row whose ``save()`` raises ``IntegrityError`` is logged and skipped;
    the remaining rows are still written.

    Args:
        item: mapping with a ``'brandinfo'`` mapping (keys as read below)
            and a ``'car'`` entry.
        spider: the spider that produced ``item``; not used here.

    Returns:
        ``item['car']``, which replaces ``item`` for later pipeline stages.
    """
    # Function-scope import keeps this block self-contained.
    import logging

    log = logging.getLogger(__name__)

    brandinfo = item['brandinfo']
    carbase = item['car']

    def store(code, **fields):
        # A single timestamp per row keeps ctime and mtime identical on
        # creation instead of differing by a few microseconds.
        now = datetime.datetime.now()
        row = BrandInfo(
            ctime=now,
            mtime=now,
            remark='crawl from haoservice',
            brandcode=code,
            **fields
        )
        try:
            row.save()
        except IntegrityError as exc:
            # The original built a DropItem here without raising it, which
            # silently swallowed the error.  Raising would discard the car
            # just because its brand is already stored, so record the skip
            # and carry on.
            # NOTE(review): presumably the violated constraint is a unique
            # brandcode -- confirm against the BrandInfo schema.
            log.info("Skipping brand code %s (integrity error): %s", code, exc)

    # maker
    store(
        brandinfo['makerId'],
        isvalid=1,
        brandname=brandinfo['makerName'],
        pm=brandinfo['pm'],
        parentid=0,
    )
    # category, attached to its maker
    store(
        brandinfo['categoryId'],
        isvalid=1,
        brandname=brandinfo['categoryName'],
        pm=brandinfo['pm'],
        parentid=brandinfo['makerId'],
    )
    # series; no ``pm`` is passed, so BrandInfo's own default applies
    store(
        brandinfo['seriesId'],
        isvalid=brandinfo['isValid'],
        brandname=brandinfo['seriesName'],
        parentid=brandinfo['categoryId'],
    )

    return carbase