def get_details(self, response):
    """Store the offers on the first Amazon page and schedule further pages.

    The per-offer extraction and saving is delegated to ``store_pages``,
    which is also the callback used for every follow-up page, so both
    paths run exactly the same logic.

    :param response: Scrapy response for the first offer-listing page.
    :returns: generator of ``Request`` objects, one per navigator entry
        except the first and the last, each handled by ``store_pages``.
    """
    # Save the offers on this page using the same routine as follow-up pages.
    self.store_pages(response)

    hxs = HtmlXPathSelector(response)
    page_links = hxs.select(PAGE_NAVIGATOR_az).extract()

    # The first and last navigator entries are skipped.
    # NOTE(review): presumably the first entry is the current page and the
    # last one a "next" link -- confirm against PAGE_NAVIGATOR_az.
    for page_link in page_links[1:-1]:
        yield Request(BASE_URL_az + page_link, self.store_pages)
def get_details(self, response):
    """Save one ``price_display`` row per seller price on a Snapdeal page.

    Every row uses the first product name matched by ``PRODUCT_NAME_sd``
    and the seller name found at the same position as the price.

    :param response: Scrapy response for the Snapdeal product page.
    :raises IndexError: if no product name is matched, or if fewer seller
        names than prices are extracted.
    """
    selector = HtmlXPathSelector(response)
    product_name = selector.select(PRODUCT_NAME_sd).extract()[0]
    price_list = selector.select(PRODUCT_SELLER_PRICES_sd).extract()
    seller_list = selector.select(PRODUCT_SELLER_NAMES_sd).extract()

    for position, price in enumerate(price_list):
        # Prices and seller names are paired purely by position.
        record = price_display(
            product_name=product_name,
            sellername=seller_list[position],
            portalname="snapdeal",
            itemname=self.item_name,
            price=price,
        )
        record.save()
def parse(self, response):
    """Save one ``price_display`` row per item in an eBay search response.

    The body is expected to be the JSON form of a
    ``findItemsByKeywordsResponse``. A response without a ``searchResult``
    or without an ``item`` list (no matches, or a failed call) is treated
    as an empty result rather than raising ``KeyError``.

    :param response: Scrapy response whose body is the JSON payload.
    """
    payload = json.loads(response.body_as_unicode())

    # Each level of the payload is a one-element list wrapping a dict;
    # fall back to an empty dict/list when a level is missing.
    responses = payload.get("findItemsByKeywordsResponse") or [{}]
    search_results = responses[0].get("searchResult") or [{}]
    items = search_results[0].get("item") or []

    for item in items:
        title = item["title"][0]
        price = item["sellingStatus"][0]["currentPrice"][0]["__value__"]
        # No seller name is read from the payload; a single space is stored.
        record = price_display(
            product_name=title,
            sellername=" ",
            portalname="Ebay",
            itemname=self.item_name,
            price=price,
        )
        record.save()
def store_pages(self, response):
    """Save one ``price_display`` row per seller price on an Amazon page.

    The seller name is read from the ``alt="..."`` attribute of the
    matching ``PRODUCT_SELLER_NAMES_az`` entry. Entries without such an
    attribute take the next unused value from
    ``PRODUCT_SELLER_NAMES_az_2``, consumed in order.

    :param response: Scrapy response for an Amazon offer-listing page.
    :raises IndexError: if fewer than five product names are matched, if
        fewer seller entries than prices are extracted, or if the fallback
        seller names run out.
    """
    import re  # local import so the block does not rely on file-level imports

    hxs = HtmlXPathSelector(response)
    # NOTE(review): the fifth PRODUCT_NAME_az match is used as the product
    # name; why index 4 is not visible here -- confirm against the XPath.
    product_name = hxs.select(PRODUCT_NAME_az).extract()[4]
    prices = hxs.select(PRODUCT_SELLER_PRICES_az).extract()
    seller_markup = hxs.select(PRODUCT_SELLER_NAMES_az).extract()
    fallback_names = hxs.select(PRODUCT_SELLER_NAMES_az_2).extract()

    # Match the alt attribute itself, so another attribute whose value merely
    # contains "alt" (e.g. an image URL) cannot be mistaken for it.
    alt_attribute = re.compile(r'(?<![\w-])alt\s*=\s*"([^"]*)"')

    fallback_index = 0
    for position, price in enumerate(prices):
        match = alt_attribute.search(seller_markup[position])
        if match:
            seller_name = match.group(1)
        else:
            # No alt attribute: use the next unused fallback seller name.
            seller_name = fallback_names[fallback_index]
            fallback_index += 1

        record = price_display(
            product_name=product_name,
            sellername=seller_name,
            portalname="amazon",
            itemname=self.item_name,
            price=price,
        )
        record.save()