示例#1
0
    def process_item(self, item, spider):
        """Build a ``Book`` from a scraped item and hand it to ``book_dao.insert``.

        Items without an ISBN are dropped. Items whose ``platform`` equals 3
        (comment items, according to the original inline note) are returned
        untouched and are not inserted.

        Args:
            item: Mapping-like scraped item. Most fields are read with ``[0]``,
                so they are presumably lists of extracted values -- TODO confirm.
            spider: The spider that produced the item (unused here).

        Returns:
            The same ``item`` object, so that later pipeline stages receive it.

        Raises:
            DropItem: If ``item['ISBN']`` is empty.
        """
        if not item['ISBN']:
            # Dropped because the ISBN is missing, not because it is a duplicate.
            raise DropItem('Missing ISBN in item: %s' % item)
        if item['platform'] == 3:
            # Comment items are left for a later pipeline stage.
            return item

        # (item key, Book attribute) pairs; each is copied only when non-empty.
        optional_fields = (
            ("name", "title"),
            ("price", "price"),
            ("author", "author"),
            ("press", "press"),
            ("instant", "instant_price"),
            ("img", "cover"),
            ("description", "description"),
        )

        new_book = Book()
        for item_key, book_attr in optional_fields:
            values = item[item_key]
            if values:
                setattr(new_book, book_attr, values[0])
        new_book.isbn = item["ISBN"][0]
        new_book.link = item["url"]
        new_book.platform = item['platform']
        # TODO: new_book.time is not populated yet.
        book_dao.insert(new_book)
        # A pipeline stage must return the item for the next stage to see it.
        return item
示例#2
0
    def process_item(item, spider):
        """Build a ``Book`` from a scraped item and hand it to ``book_dao.insert``.

        Items that are not storable books are passed through instead of being
        inserted:

        * ``platform == -1``: already flagged as "not a book"; returned as is.
        * empty ``ISBN``: flagged by setting ``platform`` to -1, then returned.
        * ``platform == 3``: comment items (per the original inline note);
          returned untouched.

        NOTE(review): the signature has no ``self`` although the function is
        indented like a method -- confirm it is a ``@staticmethod`` (decorator
        not visible here) or add ``self``.

        Args:
            item: Mapping-like scraped item. Most fields are read with ``[0]``,
                so they are presumably lists of extracted values -- TODO confirm.
            spider: The spider that produced the item (unused here).

        Returns:
            The same ``item`` object in every case.
        """
        if item['platform'] == -1:
            # Already marked as not-a-book: pass it along unchanged.
            return item
        if not item['ISBN']:
            # No ISBN means it cannot be stored as a book; mark it and pass it on.
            item['platform'] = -1
            return item
        if item['platform'] == 3:
            # Comment items are left for a later pipeline stage.
            return item

        # (item key, Book attribute) pairs; each is copied only when non-empty.
        optional_fields = (
            ("name", "title"),
            ("price", "price"),
            ("author", "author"),
            ("press", "press"),
            ("instant", "instant_price"),
            ("img", "cover"),
            ("description", "description"),
        )

        new_book = Book()
        for item_key, book_attr in optional_fields:
            values = item[item_key]
            if values:
                setattr(new_book, book_attr, values[0])
        new_book.isbn = item["ISBN"][0]
        new_book.link = item["url"]
        new_book.platform = item['platform']
        # TODO: new_book.time is not populated yet.
        book_dao.insert(new_book)
        return item
示例#3
0
 def process_item(self, item, spider):
     """Build a ``Book`` from a scraped item and hand it to ``book_dao.insert``.

     Items with an empty ``ISBN`` are returned untouched and are not inserted.
     Every other field is copied only when it is non-empty, so a missing
     value no longer raises ``IndexError``.

     Args:
         item: Mapping-like scraped item. Most fields are read with ``[0]``,
             so they are presumably lists of extracted values -- TODO confirm.
         spider: The spider that produced the item (unused here).

     Returns:
         The same ``item`` object, so that later pipeline stages receive it.
     """
     if not item['ISBN']:
         return item

     # (item key, Book attribute) pairs; each is copied only when non-empty.
     # "price" feeds ``price`` and "instant" feeds ``instant_price``; the
     # earlier version of this method had the two crossed.
     optional_fields = (
         ("name", "title"),
         ("price", "price"),
         ("author", "author"),
         ("press", "press"),
         ("instant", "instant_price"),
         ("img", "cover"),
         ("description", "description"),
     )

     newbook = Book()
     for item_key, book_attr in optional_fields:
         values = item[item_key]
         if values:
             setattr(newbook, book_attr, values[0])
     newbook.isbn = item["ISBN"][0]
     newbook.link = item["url"]
     newbook.platform = item['platform']
     # TODO: newbook.time is not populated yet.
     book_dao.insert(newbook)
     # A pipeline stage must return the item for the next stage to see it.
     return item
示例#4
0
 def process_item(self, item, spider):
     """Build a ``Book`` from a scraped item and hand it to ``book_dao.insert``.

     Items with an empty ``ISBN`` are returned untouched and are not inserted.
     (The guard used to be inverted: items *with* an ISBN were skipped and
     items without one crashed on ``item["ISBN"][0]``.)

     Args:
         item: Mapping-like scraped item. Most fields are read with ``[0]``,
             so they are presumably lists of extracted values -- TODO confirm.
         spider: The spider that produced the item (unused here).

     Returns:
         The same ``item`` object, so that later pipeline stages receive it.
     """
     if not item['ISBN']:
         return item

     # (item key, Book attribute) pairs; each is copied only when non-empty.
     optional_fields = (
         ("name", "title"),
         ("price", "price"),
         ("author", "author"),
         ("press", "press"),
         ("instant", "instant_price"),
         ("img", "cover"),
         ("description", "description"),
     )

     new_book = Book()
     for item_key, book_attr in optional_fields:
         values = item[item_key]
         if values:
             setattr(new_book, book_attr, values[0])
     new_book.isbn = item["ISBN"][0]
     new_book.link = item["url"]
     new_book.platform = item['platform']
     # TODO: new_book.time is not populated yet.
     book_dao.insert(new_book)
     # A pipeline stage must return the item for the next stage to see it.
     return item