示例#1
0
 def parse_article(self, response):
     """Populate a ``PredjItem`` with title, author and abstract.

     Every field receives the full list of strings returned by
     ``getall()`` for its XPath query.

     Args:
         response: Object exposing ``xpath()``; presumably a Scrapy
             response for an article page -- confirm against the caller.

     Returns:
         The populated ``items.PredjItem``.
     """
     # (field name, XPath query) pairs, applied in this order.
     field_queries = (
         ("title", "//ul/li[2]/text()"),
         ("author", "//ul/li[5]/text()"),
         ("abstract", "//li[@class='li14']/p/text()"),
     )
     record = items.PredjItem()
     for field, query in field_queries:
         record[field] = response.xpath(query).getall()
     return record
 def parse_article(self, response):
     """Populate a ``PredjItem`` with title, author and abstract.

     Every field receives the full list of strings returned by
     ``getall()`` for its XPath query. The title and abstract queries
     target text nodes; the author query targets the
     ``ul[@class='item authors']`` elements themselves.

     Args:
         response: Object exposing ``xpath()``; presumably a Scrapy
             response for an article page -- confirm against the caller.

     Returns:
         The populated ``items.PredjItem``.
     """
     # (field name, XPath query) pairs, applied in this order.
     field_queries = (
         ("title", "//article[@class='obj_article_details']/h1/text()"),
         ("author", "//ul[@class='item authors']"),
         ("abstract", "//div[@class='main_entry']/div/text()"),
     )
     record = items.PredjItem()
     for field, query in field_queries:
         record[field] = response.xpath(query).getall()
     return record
 def parse_article(self, response):
     """Populate a ``PredjItem`` with title, author and abstract.

     Every field receives the full list of strings returned by
     ``getall()`` for its XPath query. The title and author queries
     target ``h5`` text nodes; the abstract query targets the
     ``div[@id='articleAbstract']`` element itself.

     Args:
         response: Object exposing ``xpath()``; presumably a Scrapy
             response for an article page -- confirm against the caller.

     Returns:
         The populated ``items.PredjItem``.
     """
     # (field name, XPath query) pairs, applied in this order.
     field_queries = (
         ("title", "//div[@id='articleTitle']/h5/text()"),
         ("author", "//div[@id='authorString']/h5/text()"),
         ("abstract", "//div[@id='articleAbstract']"),
     )
     record = items.PredjItem()
     for field, query in field_queries:
         record[field] = response.xpath(query).getall()
     return record
示例#4
0
 def parse_article(self, response):
     """Populate a ``PredjItem`` with title, author, abstract and year.

     ``title`` and ``author`` take the single value returned by ``get()``
     for their query, while ``abstract`` and ``year`` take the full list
     returned by ``getall()``.

     Args:
         response: Object exposing ``xpath()``; presumably a Scrapy
             response for an article page -- confirm against the caller.

     Returns:
         The populated ``items.PredjItem``.
     """
     # (field name, XPath query, keep every match?) applied in this order.
     extraction_plan = (
         ("title", "//div[@id='articleTitle']/h3/text()", False),
         ("author", "//div[@id='authorString']/em/text()", False),
         ("abstract", "//div[@id='articleAbstract']/div/text()", True),
         ("year", "//div[@id='breadcrumb']/a/text()", True),
     )
     record = items.PredjItem()
     for field, query, keep_all in extraction_plan:
         matches = response.xpath(query)
         record[field] = matches.getall() if keep_all else matches.get()
     return record