def parse(self, response):
    # requires: import re; from scrapy.selector import Selector
    proxy = response.meta['p']
    rootPath = proxy['root']
    for sel in Selector(response=response).xpath(rootPath):
        ipPath = proxy['ip']
        portPath = proxy['port']
        ipList = sel.xpath(ipPath).extract()
        portList = sel.xpath(portPath).extract()
        ip = Utility.listToStr(ipList)
        port = Utility.listToStr(portList)
        # match a dotted IPv4 address
        regex = r'\d{1,3}(\.\d{1,3}){3}'
        if re.match(regex, ip):
            print ip
            v = ValidateIp()
            protocol, anonymous, speed = v.validate(ip, port)
            if protocol != -1:  # -1 signals an unusable proxy
                ipItem = IpItem()
                ipItem['ip'] = ip
                ipItem['port'] = port
                print ipItem['ip'], ':', ipItem['port']
                yield ipItem
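# --- Hypothetical sketch (assumed, not shown in this repo): parse() above
# relies on a Utility.listToStr helper that joins an extract() list into one
# string, and on ValidateIp.validate(ip, port) returning a
# (protocol, anonymous, speed) tuple with protocol == -1 for a dead proxy.
# A minimal implementation consistent with that usage could be:
import time
import urllib2


class Utility(object):
    @staticmethod
    def listToStr(lst):
        # join the text fragments returned by extract() and trim whitespace
        return ''.join(lst).strip()


class ValidateIp(object):
    def validate(self, ip, port):
        # probe the proxy with a cheap HTTP request; -1 flags failure
        handler = urllib2.ProxyHandler({'http': 'http://%s:%s' % (ip, port)})
        opener = urllib2.build_opener(handler)
        try:
            start = time.time()
            opener.open('http://www.baidu.com', timeout=5)
            return 'http', 'unknown', time.time() - start
        except Exception:
            return -1, None, None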
def parseAccount(self, response):
    urls = []
    # page <title>, useful to confirm the right account page loaded
    title = response.xpath('/html/head/title//text()').extract()
    print Utility.listToStr(title)
    # account = response.xpath('//*[@class="profile_info"]//text()').extract()[0].strip()
    print '----------------------account-------------------------'
    for articlePath in Selector(response=response).xpath(
            '//*[@class="weui_media_box appmsg"]/div'):
        articleListItem = ArticleListItem()
        # title
        title = articlePath.xpath('./h4//text()').extract()[0].strip()
        articleListItem['title'] = title
        print articleListItem['title']
        # url: WeChat stores the article link in a custom "hrefs" attribute
        url = articlePath.xpath('./h4//@hrefs').extract()[0]
        url = "https://mp.weixin.qq.com" + url
        articleListItem['url'] = url
        print articleListItem['url']
        # date
        date = articlePath.xpath(
            './/*[@class="weui_media_extra_info"]//text()').extract()[0]
        articleListItem['date'] = date
        print articleListItem['date']
        # abstract
        abstract = articlePath.xpath(
            './/*[@class="weui_media_desc"]//text()').extract()
        articleListItem['abstract'] = Utility.listToStr(abstract)
        print articleListItem['abstract']
        urls.append(url)
    return urls
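# --- Hypothetical illustration: parseAccount() above expects the rendered
# account-history markup, one weui_media_box block per article, with the
# article link in the custom "hrefs" attribute. A minimal sample of that
# shape (all values invented) shows what the XPaths match:
from scrapy.http import HtmlResponse

sample_body = (
    '<html><head><title>Sample account</title></head><body>'
    '<div class="weui_media_box appmsg"><div>'
    '<h4 hrefs="/s?timeline=sample">Sample title</h4>'
    '<p class="weui_media_desc">Sample abstract</p>'
    '<p class="weui_media_extra_info">2016-01-01</p>'
    '</div></div></body></html>')
sample_response = HtmlResponse(url='https://mp.weixin.qq.com/profile',
                               body=sample_body)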
def parseArticle(self, response):
    articleItem = ArticleItem()
    title = response.xpath(
        '//*[@id="activity-name"]//text()').extract()[0].strip()
    date = response.xpath('//*[@id="post-date"]//text()').extract()[0]
    author = response.xpath(
        '//*[@id="img-content"]/div[1]/em[2]//text()').extract()
    account = response.xpath('//*[@id="post-user"]//text()').extract()[0]
    accountId = response.xpath(
        '//*[@id="js_profile_qrcode"]/div/p[1]/span//text()').extract()[0]
    content = response.xpath('//*[@id="js_content"]').extract()
    articleItem['title'] = title.encode('utf-8')
    articleItem['date'] = date.encode('utf-8')
    articleItem['account'] = account.encode('utf-8')
    articleItem['accountId'] = accountId.encode('utf-8')
    articleItem['content'] = Utility.listToStr(content).encode('utf-8')
    # the byline is optional, so fall back to an empty author
    if len(author) > 0:
        articleItem['author'] = author[0].encode('utf-8')
    else:
        articleItem['author'] = ''
    print articleItem['title']
    # Utility.writeArticleToFile(articleItem)
    yield articleItem
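# --- Hypothetical sketch: the item classes filled above are assumed to be
# plain scrapy.Item declarations along these lines (field names taken from
# the code; the project's real items.py may differ):
import scrapy


class ArticleItem(scrapy.Item):
    title = scrapy.Field()
    date = scrapy.Field()
    author = scrapy.Field()
    account = scrapy.Field()
    accountId = scrapy.Field()
    content = scrapy.Field()


class ArticleListItem(scrapy.Item):
    title = scrapy.Field()
    url = scrapy.Field()
    date = scrapy.Field()
    abstract = scrapy.Field()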
def parse(self, response):
    for n in range(9):
        articleListItem = ArticleListItem()
        num = self.articleListCon
        # Sogou ids its search results sogou_vr_<num>_title_<n> / _summary_<n>
        rootPath = '//*[@id="sogou_vr_' + num
        titlePath = rootPath + '_title_' + str(n) + '"]'
        contentPath = rootPath + '_summary_' + str(n) + '"]'
        title = response.xpath(titlePath + '//text()').extract()
        url = response.xpath(titlePath + '/@href').extract()[0]
        content = response.xpath(contentPath + '//text()').extract()
        articleListItem['title'] = Utility.listToStr(title)
        articleListItem['url'] = url
        articleListItem['abstract'] = Utility.listToStr(content)
        print 'title==', articleListItem['title']
        print 'href==', articleListItem['url']
        print 'content=='
        print articleListItem['abstract']
        yield scrapy.Request(url, callback=self.parseArticle)
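# --- Illustration with assumed values: if articleListCon were '11002601',
# the concatenation above yields ids in Sogou's result naming scheme:
num, n = '11002601', 0
titlePath = '//*[@id="sogou_vr_' + num + '_title_' + str(n) + '"]'
contentPath = '//*[@id="sogou_vr_' + num + '_summary_' + str(n) + '"]'
assert titlePath == '//*[@id="sogou_vr_11002601_title_0"]'
assert contentPath == '//*[@id="sogou_vr_11002601_summary_0"]'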
def parse(self, response):
    for n in range(1):  # only the first account result is used
        accountListItem = AccountListItem()
        num = self.accountListCon
        rootPath = '//*[@id="sogou_vr_' + num + '_box_' + str(n) + '"]'
        accountIdPath = './div/div[2]/p[2]/label//text()'
        txtBox = response.xpath(rootPath)
        accountId = txtBox.xpath(accountIdPath).extract()
        accountName = txtBox.xpath('./div/div[2]/p[1]/a//text()').extract()
        url = txtBox.xpath('./div/div[2]/p[1]/a/@href').extract()[0]
        accountListItem['account'] = Utility.listToStr(accountName)
        accountListItem['url'] = url
        accountListItem['accountId'] = accountId[0].encode('utf-8')
        print accountListItem['account']
        print accountListItem['url']
        print accountListItem['accountId']
        # the account page is built by JavaScript, so render it with PhantomJS
        if url.startswith('http://'):
            url = 'https://' + url[len('http://'):]
        cmd = "phantomjs spider/getBody.js '%s'" % url
        print url
        print cmd
        stdout, stderr = subprocess.Popen(
            cmd, shell=True, stdout=subprocess.PIPE,
            stderr=subprocess.PIPE).communicate()
        r = HtmlResponse(url=url, body=stdout)
        articleUrls = self.parseAccount(r)
        # reuse ArticleSpider's parser for the rendered article pages
        for url in articleUrls:
            yield scrapy.Request(url, callback=ArticleSpider().parseArticle)
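# --- Hypothetical sketch: spider/getBody.js is assumed to be a small
# PhantomJS script that loads the url given on its command line and prints
# page.content once rendering finishes. Passing an argument list instead of
# a shell string sidesteps quoting problems with unusual urls:
import subprocess


def render_with_phantomjs(url):
    p = subprocess.Popen(['phantomjs', 'spider/getBody.js', url],
                         stdout=subprocess.PIPE, stderr=subprocess.PIPE)
    stdout, _ = p.communicate()
    return stdout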