def parse_article(self, response):
    """Build a ``PredjItem`` from an article page.

    Every field is filled with the full ``getall()`` result of its XPath
    query, so each value is a list (empty when nothing matches).

    Args:
        response: Response for the article page; must provide ``xpath()``.

    Returns:
        The populated ``items.PredjItem`` with ``title``, ``author`` and
        ``abstract`` set.
    """
    # (field name, XPath) pairs, listed in the order they are assigned.
    field_queries = (
        ("title", "//ul/li[2]/text()"),
        ("author", "//ul/li[5]/text()"),
        ("abstract", "//li[@class='li14']/p/text()"),
    )

    item = items.PredjItem()
    for field, query in field_queries:
        item[field] = response.xpath(query).getall()
    return item
def parse_article(self, response):
    """Build a ``PredjItem`` from an ``obj_article_details`` article page.

    Every field holds the ``getall()`` result of its XPath query. The
    ``title`` and ``abstract`` queries end in ``text()``; the ``author``
    query has no ``text()`` step, so it selects the matching ``<ul>``
    elements themselves rather than their text nodes.

    Args:
        response: Response for the article page; must provide ``xpath()``.

    Returns:
        The populated ``items.PredjItem`` with ``title``, ``author`` and
        ``abstract`` set.
    """
    # Insertion order of the dict is the order in which fields are assigned.
    xpath_by_field = {
        "title": "//article[@class='obj_article_details']/h1/text()",
        "author": "//ul[@class='item authors']",
        "abstract": "//div[@class='main_entry']/div/text()",
    }

    item = items.PredjItem()
    for field in xpath_by_field:
        selection = response.xpath(xpath_by_field[field])
        item[field] = selection.getall()
    return item
def parse_article(self, response):
    """Build a ``PredjItem`` from a page using ``articleTitle`` style ids.

    Every field holds the ``getall()`` result of its XPath query. The
    ``title`` and ``author`` queries target the text of ``<h5>`` children;
    the ``abstract`` query has no ``text()`` step, so it selects the
    ``articleAbstract`` ``<div>`` element itself.

    Args:
        response: Response for the article page; must provide ``xpath()``.

    Returns:
        The populated ``items.PredjItem`` with ``title``, ``author`` and
        ``abstract`` set.
    """

    def select_all(query):
        # Run one XPath query against the page and return all matches.
        return response.xpath(query).getall()

    item = items.PredjItem()
    item["title"] = select_all("//div[@id='articleTitle']/h5/text()")
    item["author"] = select_all("//div[@id='authorString']/h5/text()")
    item["abstract"] = select_all("//div[@id='articleAbstract']")
    return item
def parse_article(self, response):
    """Build a ``PredjItem`` (including ``year``) from an article page.

    ``title`` and ``author`` are extracted with ``get()`` (a single result),
    while ``abstract`` and ``year`` are extracted with ``getall()`` (every
    match). ``year`` is filled from the text of the links inside the
    ``breadcrumb`` ``<div>``.

    Args:
        response: Response for the article page; must provide ``xpath()``.

    Returns:
        The populated ``items.PredjItem`` with ``title``, ``author``,
        ``abstract`` and ``year`` set.
    """
    # (field name, XPath, take only the first match?) in assignment order.
    field_queries = (
        ("title", "//div[@id='articleTitle']/h3/text()", True),
        ("author", "//div[@id='authorString']/em/text()", True),
        ("abstract", "//div[@id='articleAbstract']/div/text()", False),
        ("year", "//div[@id='breadcrumb']/a/text()", False),
    )

    item = items.PredjItem()
    for field, query, first_only in field_queries:
        matches = response.xpath(query)
        if first_only:
            item[field] = matches.get()
        else:
            item[field] = matches.getall()
    return item