Python MycwpjtItem Examples

Programming Language: Python

Namespace/Package Name: mycwpjt.items

Class/Type: MycwpjtItem

Examples at hotexamples.com: 7

Python MycwpjtItem - 7 examples found. These are the top-rated real-world Python examples of mycwpjt.items.MycwpjtItem extracted from open-source projects. You can rate the examples to help us improve their quality.

Frequently Used Methods

Show Hide

MycwpjtItem(7)

Frequently Used Methods

MycwpjtItem (7)

Example #1

Show file

File: 第十六章源码.py Project: jhh130910/Book-PDF-Free

    def parse_item(self, response):
        """Build a MycwpjtItem from a news page's title and canonical link.

        The "name" field receives the extraction result of the <title> text
        query; the "link" field receives the extraction result of the
        canonical <link> href query.
        """
        title_xpath = "/html/head/title/text()"
        canonical_xpath = "//link[@rel='canonical']/@href"

        item = MycwpjtItem()
        # Title of the news page, located via XPath.
        item["name"] = response.xpath(title_xpath).extract()
        # Link of the current news page, located via XPath.
        item["link"] = response.xpath(canonical_xpath).extract()
        return item

Example #2

Show file

File: leocrawl.py Project: huoliang722/scrapyProj

 def parse_item(self, response):
     """Populate a MycwpjtItem from a crawled response.

     "name" is set from the <title> text query and "link" from the
     canonical <link> href query; both store what ``extract()`` returns.
     """
     item = MycwpjtItem()

     title_selection = response.xpath("/html/head/title/text()")
     item["name"] = title_selection.extract()

     canonical_selection = response.xpath("//link[@rel='canonical']/@href")
     item["link"] = canonical_selection.extract()

     return item

Example #3

Show file

File: weisuen.py Project: whyismefly/pythoncrawl

 def parse_item(self, response):
     """Return a MycwpjtItem whose "name" field holds the page title.

     Only the "name" field is filled in; it stores what ``extract()``
     returns for the <title> text query.
     """
     title_xpath = "/html/head/title/text()"

     result = MycwpjtItem()
     result["name"] = response.xpath(title_xpath).extract()
     return result

Example #4

Show file

 def parse_item(self, response):
     """Fill a MycwpjtItem with the title and canonical link of a news page."""
     # (field, XPath query) pairs, evaluated in this order:
     #   "name" -> title of the news page
     #   "link" -> link of the current news page
     field_queries = (
         ("name", "/html/head/title/text()"),
         ("link", "//link[@rel='canonical']/@href"),
     )

     item = MycwpjtItem()
     for field, query in field_queries:
         item[field] = response.xpath(query).extract()
     return item

Example #5

Show file

 def parse_item(self, response):
     """Create a MycwpjtItem carrying a news page's title and canonical link.

     Both fields store what ``extract()`` returns for their XPath query.
     """
     title_query = '/html/head/title/text()'
     link_query = '//link[@rel="canonical"]/@href'

     item = MycwpjtItem()
     # Title of the news page.
     item['name'] = response.xpath(title_query).extract()
     # Canonical link of the news page.
     item['link'] = response.xpath(link_query).extract()
     return item

Example #6

Show file

 def parse_item(self, response):
     """Build a MycwpjtItem with the page title and canonical link.

     Every extracted string is re-encoded to the encoding reported by
     ``sys.getfilesystemencoding()``.

     Args:
         response: Object exposing ``xpath(query).extract()``.

     Returns:
         A MycwpjtItem whose "name" and "link" fields each hold a list of
         encoded strings, one per extracted match.
     """
     i = MycwpjtItem()
     # NOTE(review): Python 2-only hack that changes the process-wide default
     # encoding on every call. Kept because other code may rely on it --
     # confirm before removing.
     reload(sys)
     sys.setdefaultencoding('utf-8')
     # Renamed from `type` so the builtin is no longer shadowed.
     fs_encoding = sys.getfilesystemencoding()

     # extract() returns a list of strings, so the conversion has to be
     # applied per element; calling .decode() on the list itself raised
     # AttributeError.
     titles = response.xpath("/html/head/title/text()").extract()
     i["name"] = [
         title.decode('utf-8').encode(fs_encoding) for title in titles
     ]
     links = response.xpath("//link[@rel='canonical']/@href").extract()
     i["link"] = [
         link.decode('utf-8').encode(fs_encoding) for link in links
     ]
     return i

Example #7

Show file

File: weisuen.py Project: zfatgxuestc/crawler

 def parse_item(self, response):
     """Return a MycwpjtItem holding the page title and canonical link.

     "name" and "link" store what ``extract()`` returns for the <title>
     text query and the canonical <link> href query respectively.
     """
     item = MycwpjtItem()

     page_title = response.xpath('/html/head/title/text()').extract()
     item['name'] = page_title

     canonical_href = response.xpath("//link[@rel='canonical']/@href").extract()
     item['link'] = canonical_href

     return item