def parse_items(self, response):
    """Build product items from a product page response.

    Wraps ``response`` in an ``HtmlXPathSelector``, selects every node
    matching ``//html`` and, for each one, creates an ``ActivinstinctItem``
    whose fields are filled with the ``.extract()`` result of one XPath
    query per field.

    Returns the list of items that were built.
    """
    # Field name -> XPath expression, in the order the fields are assigned.
    # NOTE(review): every expression starts with "//", so it presumably
    # searches the whole document rather than only the current node --
    # confirm against the Scrapy selector docs.
    field_queries = (
        ("productname", "//h1[@class='black']/text()"),
        ("MRP", "//p[@class='blue']/text()"),
        ("SP", "//p[@id='product-price']/text()"),
        ("Stock", "//div[@class='notifyMe-soldout']/text()"),
        ("SKU", "//div/p[@class='gray']/text()"),
        ("imgurl", "//div[@id='product-image-view']/div/a/img/@src"),
        ("Description", "//div[@id='hp_fix_desc']"),
        ("Size", "//li/a[@class='button3']/span/text()"),
        ("category", "//div[@id='breadcrumbs']/a/text()"),
    )

    selector = HtmlXPathSelector(response)
    collected = []
    for page_node in selector.select("//html"):
        product = ActivinstinctItem()
        for field_name, query in field_queries:
            product[field_name] = page_node.select(query).extract()
        collected.append(product)
    return collected
def parse(self, response):
    """Collect the menu link targets found in ``response``.

    Wraps ``response`` in an ``HtmlXPathSelector``, selects every node
    matching ``//html`` and, for each one, creates an ``ActivinstinctItem``
    whose ``"productname"`` field holds the ``.extract()`` result of the
    menu-link ``@href`` query.

    Returns the list of items that were built.
    """
    # NOTE(review): the hrefs are stored under "productname"; this looks
    # like a reused field rather than an actual product name -- confirm
    # with whatever consumes these items.
    menu_href_query = "//div[@class='menu']/div[@class='c']/ul/li/a/@href"

    selector = HtmlXPathSelector(response)
    collected = []
    for page_node in selector.select("//html"):
        entry = ActivinstinctItem()
        entry["productname"] = page_node.select(menu_href_query).extract()
        collected.append(entry)
    return collected